exact_data2023/application/functions/sentiment.py

from transformers import AutoTokenizer
from transformers import pipeline, GPT2ForSequenceClassification
import re
from facebook_scraper import get_posts

# model = 'application/models/sentiment_model'
# tokenizer = AutoTokenizer.from_pretrained('application/tokenizers/sentiment_tokenizer')

# Single identifier shared by the classifier weights and the tokenizer, so the
# two can never drift apart.
_SENTIMENT_MODEL_ID = "Scigi/sentiment-analysis-model"

# Both objects are loaded once, at import time. The classifier head is
# configured with three output labels.
model = GPT2ForSequenceClassification.from_pretrained(
    _SENTIMENT_MODEL_ID,
    num_labels=3,
)
tokenizer = AutoTokenizer.from_pretrained(_SENTIMENT_MODEL_ID)

def sentiment_prediction(data):
    """Run the sentiment classifier over ``data``.

    A ``text-classification`` pipeline is assembled from the module-level
    ``model`` and ``tokenizer`` on every call and ``data`` is handed to it
    unchanged.

    Args:
        data: Input forwarded as-is to the pipeline (presumably the list of
            cleaned sentences -- confirm against the caller).

    Returns:
        Whatever the pipeline call returns for ``data``.
    """
    classifier = pipeline(
        'text-classification',
        model=model,
        tokenizer=tokenizer,
    )
    return classifier(data)

# Matches every run of characters that is NOT an ASCII letter, a Polish
# diacritic, a space or an apostrophe. Compiled once instead of per sentence.
_DISALLOWED_CHARS = re.compile(r"[^A-Za-zżźćńółęąśŻŹĆĄŚĘŁÓŃ ']+")


def clear_data(data):
    """Normalise the sentences in ``data`` before prediction.

    Each sentence has every character other than ASCII letters, Polish
    diacritics, spaces and apostrophes removed, is stripped of surrounding
    whitespace and is lower-cased. Sentences that end up empty are dropped.

    Args:
        data: Mapping with a ``'sentences'`` key holding an iterable of
            sentences.

    Returns:
        list[str]: The cleaned, non-empty sentences in their original order.

    Raises:
        KeyError: If ``data`` has no ``'sentences'`` key.
    """
    cleaned = []
    for sentence in data['sentences']:
        # Entries that are not text (e.g. None) cannot be cleaned; skip them
        # rather than letting re.sub raise TypeError for the whole batch.
        if not isinstance(sentence, str):
            continue
        text = _DISALLOWED_CHARS.sub("", sentence).strip().lower()
        # Filter AFTER stripping so whitespace-only leftovers (e.g. from
        # "!!! ???") do not survive as empty strings.
        if text:
            cleaned.append(text)
    return cleaned

def count_predictions(predictions):
    """Tally predictions per sentiment class.

    ``LABEL_0`` is counted as negative, ``LABEL_1`` as positive and
    ``LABEL_2`` as neutral; any other label is ignored.

    Args:
        predictions: Iterable of mappings, each with a ``'label'`` key.

    Returns:
        dict: Counts under the keys ``'positive'``, ``'negative'`` and
        ``'neutral'`` (inserted in that order).
    """
    label_to_sentiment = {
        'LABEL_1': 'positive',
        'LABEL_0': 'negative',
        'LABEL_2': 'neutral',
    }
    # Pre-seed every class so absent sentiments are reported as 0.
    totals = {'positive': 0, 'negative': 0, 'neutral': 0}

    for prediction in predictions:
        sentiment = label_to_sentiment.get(prediction['label'])
        if sentiment is not None:
            totals[sentiment] += 1

    return totals

def scrapp_comments(url):
    """Scrape a Facebook post and the text of its comments.

    Args:
        url: URL of the post; passed to ``get_posts`` as the only entry of
            ``post_urls``.

    Returns:
        dict: ``{'post': <post text>, 'sentences': [<comment text>, ...]}``.
        If the scraper yields several posts, ``'post'`` holds the text of the
        last one and ``'sentences'`` the comments of all of them.

    Raises:
        ValueError: If the scraper yields no post for ``url``. (Previously
            this surfaced as an ``UnboundLocalError`` on ``text_post``.)
    """
    scraper_options = {
        "allow_extra_requests": False,
        "comments": True,
        "extra_info": True,
    }
    comments = []
    text_post = None
    post_found = False

    for post in get_posts(post_urls=[url], options=scraper_options):
        post_found = True
        text_post = post['text']
        # Guard against a post whose comment list is None instead of a list.
        for comment in post['comments_full'] or []:
            comments.append(comment['comment_text'])

    if not post_found:
        raise ValueError(f"No post could be scraped from {url!r}")

    return {'post': text_post, 'sentences': comments}
sentiment analysis 2023-05-27 15:10:30 +02:00			`from transformers import AutoTokenizer`
get model and tokenizer from HuggingFace 2023-05-30 15:30:13 +02:00			`from transformers import pipeline, GPT2ForSequenceClassification`
add preprocessing of data before predicitons 2023-05-29 23:41:36 +02:00			`import re`
add scrapper for comments, endpoint for scrapping 2023-05-30 00:00:34 +02:00			`from facebook_scraper import get_posts`
sentiment analysis 2023-05-27 15:10:30 +02:00
get model and tokenizer from HuggingFace 2023-05-30 15:30:13 +02:00			`# model = 'application/models/sentiment_model'`
			`# tokenizer = AutoTokenizer.from_pretrained('application/tokenizers/sentiment_tokenizer')`

			`model = GPT2ForSequenceClassification.from_pretrained("Scigi/sentiment-analysis-model", num_labels=3)`
			`tokenizer = AutoTokenizer.from_pretrained("Scigi/sentiment-analysis-model")`
sentiment analysis 2023-05-27 15:10:30 +02:00
			`def sentiment_prediction(data):`
			`pipe = pipeline('text-classification', model=model, tokenizer = tokenizer)`
			`result = pipe(data)`
data for bar plot 2023-05-27 16:44:44 +02:00			`return result`

add preprocessing of data before predicitons 2023-05-29 23:41:36 +02:00			`def clear_data(data):`
			`data = [re.sub(r"[^A-Za-zżźćńółęąśŻŹĆĄŚĘŁÓŃ ']+", r"", i) for i in data['sentences']]`
catch exceptions from scrapper 2023-05-30 13:57:44 +02:00			`data = [x for x in data if x != '']`
add preprocessing of data before predicitons 2023-05-29 23:41:36 +02:00			`data = [i.strip() for i in data]`
			`data = [i.lower() for i in data]`
			`return data`

data for bar plot 2023-05-27 16:44:44 +02:00			`def count_predictions(predictions):`
			`l0 = 0`
			`l1 = 0`
			`l2 = 0`
			`all = {}`

			`for i in predictions:`
			`if i['label'] == 'LABEL_0':`
			`l0 += 1`
			`if i['label'] == 'LABEL_1':`
			`l1 += 1`
			`if i['label'] == 'LABEL_2':`
			`l2 += 1`

			`all['positive'] = l1`
			`all['negative'] = l0`
			`all['neutral'] = l2`

add scrapper for comments, endpoint for scrapping 2023-05-30 00:00:34 +02:00			`return all`

			`def scrapp_comments(url):`
scrapp post 2023-05-30 00:47:35 +02:00			`comments= []`
			`all = {}`
add scrapper for comments, endpoint for scrapping 2023-05-30 00:00:34 +02:00			`for post in get_posts(post_urls=[url], options={"allow_extra_requests": False, "comments":True, "extra_info":True}):`
scrapp post 2023-05-30 00:47:35 +02:00			`text_post = post['text']`
add scrapper for comments, endpoint for scrapping 2023-05-30 00:00:34 +02:00			`for comment in post['comments_full']:`
scrapp post 2023-05-30 00:47:35 +02:00			`comments.append(comment['comment_text'])`
			`all['post'] = text_post`
catch exceptions from scrapper 2023-05-30 13:57:44 +02:00			`all['sentences'] = comments`
scrapp post 2023-05-30 00:47:35 +02:00			`return all`