Spaces:

sky4432
/

Shot-Shot

Sleeping

App Files Files Community

sky4432 committed 8 days ago

Commit

ef15b80

verified ·

1 Parent(s): 2d368ee

Update app.py

Browse files

Files changed (1) hide show

app.py +30 -69

app.py CHANGED Viewed

@@ -1,92 +1,53 @@
 import streamlit as st
-import pandas as pd
 from transformers import pipeline
-#######################################
-# 1) 모델 준비
-#######################################
-# (A) Zero-Shot 분류 파이프라인 (다국어 모델)
 topic_classifier = pipeline(
     "zero-shot-classification",
-    model="joeddav/xlm-roberta-large-xnli"
 )
-# (B) 감성분석 파이프라인 (koelectra-nsmc 예시)
 sentiment_analyzer = pipeline(
     "sentiment-analysis",
     model="monologg/koelectra-base-finetuned-nsmc"
 )
-# 분류할 주제 라벨 (HR 이슈 예시)
-topic_labels = ["근무환경", "복리후생", "급여", "평가보상", "제도", "생산라인", "조직문화", "인원충원", "기타"]
-#######################################
-# 2) Streamlit UI
-#######################################
-st.title("Employee Feedback Analyzer")
 st.write("""
-**직원 익명게시판** 등 텍스트를 업로드하여,
-- **이슈 주제**(Zero-Shot)
-- **감성분석**(긍정/부정)
-결과를 확인할 수 있는 데모입니다.
 """)
-uploaded_file = st.file_uploader("CSV 또는 XLSX 파일을 업로드하세요", type=["csv", "xlsx"])
-if uploaded_file is not None:
-    # 2-1) 파일 로드
-    if uploaded_file.name.endswith(".csv"):
-        df = pd.read_csv(uploaded_file)
     else:
-        df = pd.read_excel(uploaded_file)
-    st.write("업로드된 데이터 (최대 5행 미리보기):")
-    st.dataframe(df.head())
-    # 'content'라는 열에 게시글이 있다고 가정
-    text_column = st.selectbox("분석할 텍스트 컬럼 선택", df.columns)
-    if st.button("분석 시작"):
-        # 결과 저장 리스트
-        topics = []
-        topic_scores = []
-        sentiments = []
-        sentiment_scores = []
-        for text in df[text_column]:
-            # Zero-Shot 분류
-            # truncation=True로 글이 길어도 최대 토큰 초과 에러 방지
-            topic_result = topic_classifier(text, topic_labels, truncation=True)
-            # 가장 확률 높은 라벨
-            pred_label = topic_result["labels"][0]
-            pred_score = topic_result["scores"][0]
-            # 감성분석
-            sentiment_result = sentiment_analyzer(text, truncation=True)
-            sent_label = sentiment_result[0]["label"]
-            sent_score = sentiment_result[0]["score"]
-            topics.append(pred_label)
-            topic_scores.append(round(pred_score, 4))
-            sentiments.append(sent_label)
-            sentiment_scores.append(round(sent_score, 4))
-        # 결과를 데이터프레임에 추가
-        df["pred_topic"] = topics
-        df["topic_score"] = topic_scores
-        df["sentiment_label"] = sentiments
-        df["sentiment_score"] = sentiment_scores
-        st.write("분석 결과")
-        st.dataframe(df)
-        # 다운로드 버튼
-        csv_data = df.to_csv(index=False).encode("utf-8-sig")
-        st.download_button(
-            label="결과 CSV 다운로드",
-            data=csv_data,
-            file_name="employee_feedback_analysis.csv",
-            mime="text/csv"
-        )

 import streamlit as st
 from transformers import pipeline
+# Zero-Shot 분류 모델 (이슈주제 분류)
 topic_classifier = pipeline(
     "zero-shot-classification",
+    model="joeddav/xlm-roberta-large-xnli"  # 다국어 지원
 )
+# 감성분석 모델 (koelectra-nsmc)
 sentiment_analyzer = pipeline(
     "sentiment-analysis",
     model="monologg/koelectra-base-finetuned-nsmc"
 )
+# 정의할 주제 라벨 (예시)
+topic_labels = ["근무환경", "복리후생", "조직문화", "급여", "제도평가보상", "셍산라인", "인력충원", "기타"]
+st.title("이슈주제 + 감성분석 (복붙 버전)")
 st.write("""
+**아래 입력란에 5,000자 이하로 텍스트를 붙여넣은 뒤, '분석하기'를 눌러주세요.**
+- Zero-Shot 분류 → **근무환경 / 복리후생 / 조직문화 / 인원충원 / 기타**
+- 감성분석 → **긍정(positive) / 부정(negative)**
 """)
+# 최대 5000자 제한
+input_text = st.text_area("텍스트 입력", max_chars=5000, height=300)
+if st.button("분석하기"):
+    if len(input_text.strip()) == 0:
+        st.warning("분석할 텍스트를 입력해주세요!")
     else:
+        # 1) Zero-Shot 분류
+        topic_result = topic_classifier(
+            input_text,
+            topic_labels,
+            truncation=True  # 글자 수가 많을 때 오류 방지(512토큰 초과 시 잘라냄)
+        )
+        pred_topic = topic_result["labels"][0]
+        topic_score = topic_result["scores"][0]
+        # 2) 감성분석
+        sent_result = sentiment_analyzer(input_text, truncation=True)
+        sent_label = sent_result[0]["label"]
+        sent_score = sent_result[0]["score"]
+        st.subheader("분석 결과")
+        st.write(f"- **주제**: {pred_topic} (score={topic_score:.4f})")
+        st.write(f"- **감성**: {sent_label} (score={sent_score:.4f})")
+        st.success("분석 완료!")