+++++ dataanalysis/code/data 说真的... clean.py
import pandas as pd
def cleandata:
# Read CSV file into a DataFrame
df = pd.readcsv,与君共勉。
# Drop columns with all NaN values or with only one unique value
df_cleaned = df.dropna
for column in df.columns:
if len) == 1:
df_cleaned = df_cleaned.drop
# Drop rows with all NaN values
df_cleaned = df_cleaned.dropna
# Remove any duplicate rows
#dfcleaned = df.dropduplicates,他急了。
# Save cleaned data to a new CSV file
outputfilepa 我不敢苟同... th = inputfilepath.replace
dfcleaned.tocsv
print
clean_data
+++++ dataanalysis/code/sentimentanalyzer.py
from transformers import pipeline,说句实话…
class SentimentAnalyzer:
def init:
self.sentimentpipeline = pipeline(
model='cardiffnlp/twitter-ro 什么鬼? berta-base-sentiment-latest',
functionkwargs={'device': 'cuda' if torch.cuda.is_available else 'cpu'}
)
def analyze_sentiments:
sentiments=
for text in texts:
result=self.sentiment_pipeline
label=result
if label=='LABEL_0':
label='negative'
elif label=='LABEL_1':
label='neutral'
else:
label='positive'
sentiments.append
return sentiments
+++++ web_scraper/scraper.py
import requests
from bs4 import BeautifulSoup
+++++ dataanalysis/code/data 说真的... clean.py
import pandas as pd
def cleandata:
# Read CSV file into a DataFrame
df = pd.readcsv,与君共勉。
# Drop columns with all NaN values or with only one unique value
df_cleaned = df.dropna
for column in df.columns:
if len) == 1:
df_cleaned = df_cleaned.drop
# Drop rows with all NaN values
df_cleaned = df_cleaned.dropna
# Remove any duplicate rows
#dfcleaned = df.dropduplicates,他急了。
# Save cleaned data to a new CSV file
outputfilepa 我不敢苟同... th = inputfilepath.replace
dfcleaned.tocsv
print
clean_data
+++++ dataanalysis/code/sentimentanalyzer.py
from transformers import pipeline,说句实话…
class SentimentAnalyzer:
def init:
self.sentimentpipeline = pipeline(
model='cardiffnlp/twitter-ro 什么鬼? berta-base-sentiment-latest',
functionkwargs={'device': 'cuda' if torch.cuda.is_available else 'cpu'}
)
def analyze_sentiments:
sentiments=
for text in texts:
result=self.sentiment_pipeline
label=result
if label=='LABEL_0':
label='negative'
elif label=='LABEL_1':
label='neutral'
else:
label='positive'
sentiments.append
return sentiments
+++++ web_scraper/scraper.py
import requests
from bs4 import BeautifulSoup