Spaces:

rodrigomasini
/

recurrentGPT

Running

rodrigomasini committed on May 24, 2024

Commit

36c019e

verified ·

1 Parent(s): a337459

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -229,26 +229,34 @@ def pre_process_text(text):
     # Split the text into sections
     sections = re.split(r'\n{2,}', text)
     # Remove empty strings from the split result
     sections = [section.strip() for section in sections if section.strip()]
     # Combine sections into a single string
-    combined_text = '\n\n'.join(sections)
-    sentences_list = re.split(r'(?<!\w\.\w.)(?<![A-Z][a-z]\.)(?<=\.|\?)\s', text)
-    print(sentences_list)
     # Split the elements of the list by newline characters
     split_sentences = []
     for sentence in sentences_list:
         split_sentences.extend(re.split(r'\n+', sentence))
     # Remove empty elements
     cleaned_sentences = [sentence for sentence in split_sentences if sentence.strip()]
-    combined_text = (" ".join(cleaned_sentences))
-    return combined_text
 def flesch_kincaid_grade_level(text):
     sentences = pre_process_text(text)

     # Split the text into sections
     sections = re.split(r'\n{2,}', text)
+    print("Sections:", sections)
     # Remove empty strings from the split result
     sections = [section.strip() for section in sections if section.strip()]
+    print("Non-empty Sections:", sections)
     # Combine sections into a single string
+    combined_text = ' '.join(sections)
+    print("Combined Text:", combined_text)
+    # Split the text into sentences
+    sentences_list = re.split(r'(?<!\w\.\w.)(?<![A-Z][a-z]\.)(?<=\.|\?)\s', combined_text)
+    print("Sentences List:", sentences_list)
     # Split the elements of the list by newline characters
     split_sentences = []
     for sentence in sentences_list:
         split_sentences.extend(re.split(r'\n+', sentence))
+    print("Split Sentences:", split_sentences)
     # Remove empty elements
     cleaned_sentences = [sentence for sentence in split_sentences if sentence.strip()]
+    print("Cleaned Sentences:", cleaned_sentences)
+    combined_cleaned_text = " ".join(cleaned_sentences)
+    print("Combined Cleaned Text:", combined_cleaned_text)
+    return combined_cleaned_text
 def flesch_kincaid_grade_level(text):
     sentences = pre_process_text(text)