implement scores for roberta and germanSentiment

This commit is contained in:
rnsrk 2023-01-24 21:23:37 +01:00
parent 52223192b4
commit fae306916f
2 changed files with 11 additions and 7 deletions

View file

@ -31,21 +31,25 @@ class SentiTooter:
def analyze(self, language, content):
match language:
case 'de':
sentiment = self.deModel.predict_sentiment([content])
sentiment.append('germanSentiment')
return sentiment
sentimentList, probabilitiesList = self.deModel.predict_sentiment([content], output_probabilities=True)
sentiment = sentimentList[0]
score = {i[0]: i[1] for i in probabilitiesList[0]}[sentiment]
return [sentiment, 'germanSentiment', score]
case 'en':
text = preprocess(content)
encoded_input = self.enTokenizer(text, return_tensors='pt')
output = self.enModel(**encoded_input)
scores = output[0][0].detach().numpy()
scores = softmax(scores)
print(scores)
sentimentIndexWithMaxScore = np.argmax(scores)
sentimentLabel = self.labels[sentimentIndexWithMaxScore]
sentiment = [sentimentLabel, 'twitter-roberta-base-sentiment']
sentiment = [sentimentLabel, 'twitter-roberta-base-sentiment', max(scores)]
print(sentiment)
return sentiment
case _:
compound = self.sia.polarity_scores(content)['compound']
print(self.sia.polarity_scores(content), 'vaderSentiment')
if compound > (1 / 3):
return ['positive', 'vaderSentiment']
elif compound < (-1 / 3):