Spaces:

FPRT
/

ThematicAnalysis

Sleeping

noequal committed on Nov 8, 2023

Commit

f9b90ad

1 Parent(s): 9626dcf

Create text_processor.py

Files changed (1) hide show

text_processor.py ADDED Viewed

# Function for generating text based on input
def generate_text(input_text, model, tokenizer, max_new_tokens=5):
    """Generate text for ``input_text`` followed by the ' [LABEL]' marker.

    Args:
        input_text: Prompt string. ' [LABEL]' is appended before encoding.
        model: Object exposing ``generate(input_ids, attention_mask=...,
            max_length=..., do_sample=..., top_p=...)``.
        tokenizer: Object exposing ``encode(text, return_tensors='pt')`` and
            ``decode(ids, skip_special_tokens=...)``.
        max_new_tokens: Number of tokens added to the encoded prompt length
            to form the ``max_length`` budget passed to ``model.generate``.
            Defaults to 5.

    Returns:
        The decoded string of the first sequence returned by
        ``model.generate``, with special tokens kept.
    """
    # Imported locally so the function does not depend on a module-level
    # ``import torch`` being present.
    import torch

    prompt = input_text + ' [LABEL]'
    input_ids = tokenizer.encode(prompt, return_tensors='pt')
    attention_mask = torch.ones_like(input_ids)

    # ``len(tensor)`` is the size of the FIRST dimension, which for an encoded
    # prompt requested with return_tensors='pt' is presumably the batch size
    # (1), not the token count. The last dimension is the sequence length.
    prompt_length = input_ids.shape[-1]

    outputs = model.generate(
        input_ids,
        attention_mask=attention_mask,
        max_length=prompt_length + max_new_tokens,
        do_sample=True,
        top_p=0.95,
    )

    # NOTE(review): the raw decoded string is returned, not a parsed label
    # list — confirm callers expect the unparsed text.
    return tokenizer.decode(outputs[0], skip_special_tokens=False)
# Function for sequence classification
def classify_text(input_text, model, tokenizer):
    """Run ``model`` on the encoded ``input_text`` and post-process the output.

    Args:
        input_text: Text to classify.
        model: Callable invoked as ``model(input_ids, attention_mask=...)``.
        tokenizer: Object exposing ``encode(text, return_tensors='pt')``.

    Returns:
        Whatever ``post_process_labels`` returns for the model output.
    """
    # Imported locally so the function does not depend on a module-level
    # ``import torch`` being present.
    import torch

    # Tokenize the input text; the mask marks every position as attended.
    input_ids = tokenizer.encode(input_text, return_tensors='pt')
    attention_mask = torch.ones_like(input_ids)

    # Perform sequence classification
    result = model(input_ids, attention_mask=attention_mask)

    # Post-process the results (e.g., select labels based on a threshold).
    # NOTE(review): ``post_process_labels`` is not defined in this block; it
    # must be available at module level — confirm where it comes from.
    return post_process_labels(result)