handle the following issue

Louquinze · Louquinze · commit cdaeed5dec24 · 2022-02-24T10:10:22.000+01:00
automl#1373 (comment): this commit fixes the first 3 bullet points on the to-do list. 1. Rename the hyperparameter "ngram_range" --> "ngram_upper_bound"; this includes changing all *csv and *json files. 2. Create a new text preprocessing example, example_text_preprocessing.py; this new example features the 20Newsgroups dataset. The import in example_text_preprocessing.py is too long, but I cannot come up with a good solution. Include feedback from 02.24.
diff --git a/examples/40_advanced/example_text_preprocessing.py b/examples/40_advanced/example_text_preprocessing.py
@@ -1,17 +1,15 @@
 # -*- encoding: utf-8 -*-
 """
-==============
+==================
 Text preprocessing
-==============
+==================
 
 The following example shows how to fit a simple NLP problem with
 *auto-sklearn*.
 
-For deeper insights into the field of text preprocessing you can follow these links:
+For an introduction to text preprocessing you can follow these links:
     1. https://scikit-learn.org/stable/tutorial/text_analytics/working_with_text_data.html
     2. https://machinelearningmastery.com/clean-text-machine-learning-python/
-
-
 """
 from pprint import pprint
 
diff --git a/test/test_pipeline/components/data_preprocessing/test_data_preprocessing_text.py b/test/test_pipeline/components/data_preprocessing/test_data_preprocessing_text.py
@@ -2,10 +2,10 @@
 
 import numpy as np
 import pandas as pd
-from autosklearn.pipeline.components.data_preprocessing.text_encoding.bag_of_word_encoding import (
+from autosklearn.pipeline.components.data_preprocessing.text_encoding.bag_of_word_encoding import (  # noqa: E501
     BagOfWordEncoder as BOW,
 )
-from autosklearn.pipeline.components.data_preprocessing.text_encoding.bag_of_word_encoding_distinct import (
+from autosklearn.pipeline.components.data_preprocessing.text_encoding.bag_of_word_encoding_distinct import (  # noqa: E501
     BagOfWordEncoder as BOW_distinct,
 )
 

Original file line number	Diff line number	Diff line change
`@@ -2,10 +2,10 @@`
`2`	`2`
`3`	`3`	`import numpy as np`
`4`	`4`	`import pandas as pd`
`5`		`-from autosklearn.pipeline.components.data_preprocessing.text_encoding.bag_of_word_encoding import (`
	`5`	`+from autosklearn.pipeline.components.data_preprocessing.text_encoding.bag_of_word_encoding import ( # noqa: E501`
`6`	`6`	`BagOfWordEncoder as BOW,`
`7`	`7`	`)`
`8`		`-from autosklearn.pipeline.components.data_preprocessing.text_encoding.bag_of_word_encoding_distinct import (`
	`8`	`+from autosklearn.pipeline.components.data_preprocessing.text_encoding.bag_of_word_encoding_distinct import ( # noqa: E501`
`9`	`9`	`BagOfWordEncoder as BOW_distinct,`
`10`	`10`	`)`
`11`	`11`