Spaces:

sashtech
/

aihumanifierandgrmoform

Sleeping

App Files Community

sashtech committed on Sep 23, 2024

Commit

a69899f

verified ·

1 Parent(s): fe589d8

Update app.py

Browse files

Files changed (1) hide show

app.py +29 -25

app.py CHANGED Viewed

@@ -42,23 +42,19 @@ def fix_punctuation_spacing(text):
     # Split the text into words and punctuation
     words = text.split(' ')
     cleaned_words = []
-    # Define punctuation marks to check
     punctuation_marks = {',', '.', "'", '!', '?', ':'}
     for word in words:
-        # If the word ends with a punctuation mark, remove space before it
         if cleaned_words and word and word[0] in punctuation_marks:
-            cleaned_words[-1] += word  # Append punctuation to the last word
         else:
-            cleaned_words.append(word)  # Add word to the list
     return ' '.join(cleaned_words).replace(' ,', ',').replace(' .', '.').replace(" '", "'") \
                                     .replace(' !', '!').replace(' ?', '?').replace(' :', ':')
 # Function to fix possessives like "Earth's"
 def fix_possessives(text):
-    # Simple rule to catch possessives and correct spacing
     text = re.sub(r'(\w)\s\'\s?s', r"\1's", text)
     return text
@@ -70,9 +66,9 @@ def capitalize_sentences_and_nouns(text):
     for sent in doc.sents:
         sentence = []
         for token in sent:
-            if token.i == sent.start:  # First word of the sentence
                 sentence.append(token.text.capitalize())
-            elif token.pos_ == "PROPN":  # Proper noun
                 sentence.append(token.text.capitalize())
             else:
                 sentence.append(token.text)
@@ -82,14 +78,12 @@ def capitalize_sentences_and_nouns(text):
 # Function to force capitalization of the first letter of every sentence and ensure full stops
 def force_first_letter_capital(text):
-    sentences = re.split(r'(?<=\w[.!?])\s+', text)  # Split based on sentence-ending punctuation
     capitalized_sentences = []
     for sentence in sentences:
         if sentence:
-            # Capitalize the first letter if not already capitalized
             capitalized_sentence = sentence[0].capitalize() + sentence[1:]
-            # Ensure there's a full stop at the end if there's no punctuation
             if not re.search(r'[.!?]$', capitalized_sentence):
                 capitalized_sentence += '.'
             capitalized_sentences.append(capitalized_sentence)
@@ -131,9 +125,9 @@ def ensure_subject_verb_agreement(text):
     corrected_text = []
     for token in doc:
         if token.dep_ == "nsubj" and token.head.pos_ == "VERB":
-            if token.tag_ == "NN" and token.head.tag_ != "VBZ":  # Singular noun, should use singular verb
                 corrected_text.append(token.head.lemma_ + "s")
-            elif token.tag_ == "NNS" and token.head.tag_ == "VBZ":  # Plural noun, should not use singular verb
                 corrected_text.append(token.head.lemma_)
         corrected_text.append(token.text)
     return ' '.join(corrected_text)
@@ -147,31 +141,41 @@ def correct_spelling(text):
         if corrected_word is not None:
             corrected_words.append(corrected_word)
         else:
-            corrected_words.append(word)  # Keep the original word if correction is None
     return ' '.join(corrected_words)
 # Main function for paraphrasing and grammar correction
 def paraphrase_and_correct(text):
-    # Remove meaningless or redundant words first
     cleaned_text = remove_redundant_words(text)
-    # Capitalize sentences and nouns
     paraphrased_text = capitalize_sentences_and_nouns(cleaned_text)
-    # Ensure first letter of each sentence is capitalized
     paraphrased_text = force_first_letter_capital(paraphrased_text)
-    # Apply grammatical corrections
     paraphrased_text = correct_article_errors(paraphrased_text)
     paraphrased_text = correct_tense_errors(paraphrased_text)
     paraphrased_text = ensure_subject_verb_agreement(paraphrased_text)
-    # Fix punctuation spacing and possessives
     paraphrased_text = fix_possessives(paraphrased_text)
-    # Correct spelling errors
     paraphrased_text = correct_spelling(paraphrased_text)
     paraphrased_text = fix_punctuation_spacing(paraphrased_text)
     return paraphrased_text

     # Split the text into words and punctuation
     words = text.split(' ')
     cleaned_words = []
     punctuation_marks = {',', '.', "'", '!', '?', ':'}
     for word in words:
         if cleaned_words and word and word[0] in punctuation_marks:
+            cleaned_words[-1] += word
         else:
+            cleaned_words.append(word)
     return ' '.join(cleaned_words).replace(' ,', ',').replace(' .', '.').replace(" '", "'") \
                                     .replace(' !', '!').replace(' ?', '?').replace(' :', ':')
 # Function to fix possessives like "Earth's"
 def fix_possessives(text):
     text = re.sub(r'(\w)\s\'\s?s', r"\1's", text)
     return text
     for sent in doc.sents:
         sentence = []
         for token in sent:
+            if token.i == sent.start:
                 sentence.append(token.text.capitalize())
+            elif token.pos_ == "PROPN":
                 sentence.append(token.text.capitalize())
             else:
                 sentence.append(token.text)
 # Function to force capitalization of the first letter of every sentence and ensure full stops
 def force_first_letter_capital(text):
+    sentences = re.split(r'(?<=\w[.!?])\s+', text)
     capitalized_sentences = []
     for sentence in sentences:
         if sentence:
             capitalized_sentence = sentence[0].capitalize() + sentence[1:]
             if not re.search(r'[.!?]$', capitalized_sentence):
                 capitalized_sentence += '.'
             capitalized_sentences.append(capitalized_sentence)
     corrected_text = []
     for token in doc:
         if token.dep_ == "nsubj" and token.head.pos_ == "VERB":
+            if token.tag_ == "NN" and token.head.tag_ != "VBZ":
                 corrected_text.append(token.head.lemma_ + "s")
+            elif token.tag_ == "NNS" and token.head.tag_ == "VBZ":
                 corrected_text.append(token.head.lemma_)
         corrected_text.append(token.text)
     return ' '.join(corrected_text)
         if corrected_word is not None:
             corrected_words.append(corrected_word)
         else:
+            corrected_words.append(word)
     return ' '.join(corrected_words)
+# Function to replace a word with its synonym
+def replace_with_synonyms(text):
+    words = text.split()
+    replaced_words = []
+    for word in words:
+        synonyms = wordnet.synsets(word)
+        if synonyms:
+            # Take the first synonym if available
+            synonym = synonyms[0].lemmas()[0].name()
+            # Replace the word with its synonym if it's different
+            if synonym.lower() != word.lower():
+                replaced_words.append(synonym.replace('_', ' '))
+            else:
+                replaced_words.append(word)
+        else:
+            replaced_words.append(word)
+    return ' '.join(replaced_words)
 # Main function for paraphrasing and grammar correction
 def paraphrase_and_correct(text):
     cleaned_text = remove_redundant_words(text)
     paraphrased_text = capitalize_sentences_and_nouns(cleaned_text)
     paraphrased_text = force_first_letter_capital(paraphrased_text)
     paraphrased_text = correct_article_errors(paraphrased_text)
     paraphrased_text = correct_tense_errors(paraphrased_text)
     paraphrased_text = ensure_subject_verb_agreement(paraphrased_text)
     paraphrased_text = fix_possessives(paraphrased_text)
     paraphrased_text = correct_spelling(paraphrased_text)
     paraphrased_text = fix_punctuation_spacing(paraphrased_text)
+    paraphrased_text = replace_with_synonyms(paraphrased_text)  # Add synonym replacement here
     return paraphrased_text