Spaces:

Kims12
/

1_4_keyword

Sleeping

App Files Files Community

Kims12 committed on Aug 19, 2024

Commit

46e9dda

verified ·

1 Parent(s): afd67dc

Update app.py

Browse files

Files changed (1) hide show

app.py +12 -16

app.py CHANGED Viewed

@@ -7,12 +7,9 @@ import os
 def process_excel(file):
     # 엑셀 파일 읽기
     df = pd.read_excel(file.name)
-    # 모든 셀을 아래로 3칸씩 이동
-    shifted_df = df.shift(3)
     # D열의 데이터 추출
-    product_names = shifted_df.iloc[:, 3].dropna()  # D열은 0부터 시작하므로 index는 3
     # 키워드 추출 및 빈도 계산
     all_keywords = []
@@ -31,28 +28,27 @@ def process_excel(file):
     result_df = pd.DataFrame(keyword_counts.items(), columns=['Keyword', 'Frequency'])
     result_df = result_df.sort_values(by='Frequency', ascending=False).reset_index(drop=True)
     # 디렉토리 생성 확인 및 파일 저장
     output_dir = "output"
     if not os.path.exists(output_dir):
         os.makedirs(output_dir)
-    # 결과를 저장할 파일명 설정
-    output_file_shifted = os.path.join(output_dir, "shifted_excel.xlsx")
-    output_file_keywords = os.path.join(output_dir, "keyword_counts.xlsx")
-    # 이동된 데이터프레임과 키워드 카운트 결과를 각각 저장
-    shifted_df.to_excel(output_file_shifted, index=False)
-    result_df.to_excel(output_file_keywords, index=False)
-    return [output_file_shifted, output_file_keywords]
 # Gradio 인터페이스 정의
 iface = gr.Interface(
     fn=process_excel,
     inputs=gr.File(file_types=[".xlsx"]),  # 엑셀 파일만 업로드할 수 있게 설정
-    outputs=[gr.File(label="Shifted Excel File"), gr.File(label="Keyword Counts Excel File")],
-    title="Excel Shift Rows and Keyword Extraction",
-    description="엑셀 파일의 모든 셀을 아래로 3칸씩 이동시키고, D열에서 키워드를 추출하여 빈도를 계산한 후 결과를 제공합니다."
 )
 if __name__ == "__main__":

 def process_excel(file):
     # 엑셀 파일 읽기
     df = pd.read_excel(file.name)
     # D열의 데이터 추출
+    product_names = df.iloc[:, 3].dropna()  # D열은 0부터 시작하므로 index는 3
     # 키워드 추출 및 빈도 계산
     all_keywords = []
     result_df = pd.DataFrame(keyword_counts.items(), columns=['Keyword', 'Frequency'])
     result_df = result_df.sort_values(by='Frequency', ascending=False).reset_index(drop=True)
+    # A4, B4부터 결과를 시작하도록 데이터프레임을 수정
+    result_df_shifted = pd.DataFrame(index=range(3))  # 빈 데이터프레임 생성 (3칸 아래로 이동)
+    result_df_shifted = pd.concat([result_df_shifted, result_df]).reset_index(drop=True)
     # 디렉토리 생성 확인 및 파일 저장
     output_dir = "output"
     if not os.path.exists(output_dir):
         os.makedirs(output_dir)
+    output_file = os.path.join(output_dir, "keyword_counts.xlsx")
+    result_df_shifted.to_excel(output_file, index=False, header=False, startrow=3)  # 3행에서 시작
+    return output_file
 # Gradio 인터페이스 정의
 iface = gr.Interface(
     fn=process_excel,
     inputs=gr.File(file_types=[".xlsx"]),  # 엑셀 파일만 업로드할 수 있게 설정
+    outputs="file",
+    title="Excel Keyword Extractor",
+    description="엑셀 파일의 D열에서 키워드를 추출하고 빈도를 계산하여 새로운 엑셀 파일로 출력합니다."
 )
 if __name__ == "__main__":