Tao Wu committed on
Commit
23aeabb
•
1 Parent(s): 8bfe948

add BA courses

Browse files
app/app.py CHANGED
@@ -1,6 +1,5 @@
1
  import gradio as gr
2
  import pandas as pd
3
- import redis
4
  import json
5
  import requests
6
  from config import *
 
1
  import gradio as gr
2
  import pandas as pd
 
3
  import json
4
  import requests
5
  from config import *
app/config.py CHANGED
@@ -18,7 +18,7 @@ QUERY_INSTRUCTION = os.getenv('QUERY_INSTRUCTION', '')
18
  # Other configurations
19
  TOP_K = int(os.getenv('TOP_K', 10))
20
  #PERSIST_DIRECTORY = os.getenv('PERSIST_DIRECTORY', "/app/data/course_emb_db")
21
- PERSIST_DIRECTORY = os.getenv('PERSIST_DIRECTORY', "/app/data/EduGBERT_cos_escoai")
22
  CSV_FILE_PATH = os.getenv('CSV_FILE_PATH', '/app/data/occupations_de.csv')
23
 
24
  REC_LORA_MODEL = os.getenv('REC_LORA_MODEL', 'wt3639/Llama-3-8B-Instruct_CourseRec_lora')
 
18
  # Other configurations
19
  TOP_K = int(os.getenv('TOP_K', 10))
20
  #PERSIST_DIRECTORY = os.getenv('PERSIST_DIRECTORY', "/app/data/course_emb_db")
21
+ PERSIST_DIRECTORY = os.getenv('PERSIST_DIRECTORY', "/app/data/BA_Udemy_Berufe")
22
  CSV_FILE_PATH = os.getenv('CSV_FILE_PATH', '/app/data/occupations_de.csv')
23
 
24
  REC_LORA_MODEL = os.getenv('REC_LORA_MODEL', 'wt3639/Llama-3-8B-Instruct_CourseRec_lora')
app/data/{multilingual-e5_cos_escoai/c4b78092-a1fa-41fc-b6b0-8fa36ef29576 → BA_Udemy_Berufe/7611ee46-6912-4fba-9d4f-830c52f852f9}/data_level0.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5febe5913f14ef4735dcb9551b6f86e9d183b2fac0a2c1ac980fee33a6443534
3
- size 25416000
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df7c8f847f4d7a01edb958af28a19d8b3c7798e70d4be95ca9f3e865e0e81b50
3
+ size 93192000
app/data/{multilingual-e5_cos_escoai/c4b78092-a1fa-41fc-b6b0-8fa36ef29576 → BA_Udemy_Berufe/7611ee46-6912-4fba-9d4f-830c52f852f9}/header.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7ffd5ef9bb9ca1a421e18216d2997eea01192524736b484b49cd43b46e42e31f
3
  size 100
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7d53ddf53cd122b7667711e9b5a4fb474c0a32263ca4f34857b263d16438ab2
3
  size 100
app/data/{multilingual-e5_cos_escoai/c4b78092-a1fa-41fc-b6b0-8fa36ef29576 → BA_Udemy_Berufe/7611ee46-6912-4fba-9d4f-830c52f852f9}/index_metadata.pickle RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9f91c55d437d031ea4094c2a2c3e35e0aec42eb5d5f60821d7b164f714228dbe
3
- size 346049
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:113271d35a2fc518053f5f0bd1bab69aa967b48584e4c1f86237e19ae05aa4c8
3
+ size 1274271
app/data/{multilingual-e5_cos_escoai/c4b78092-a1fa-41fc-b6b0-8fa36ef29576 → BA_Udemy_Berufe/7611ee46-6912-4fba-9d4f-830c52f852f9}/length.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1d3b0223a8c3ef4338003b319ca7fe73feb39b300f9dc618e6a9373083b59f6a
3
- size 24000
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9cdb71300efa91ff069b85d3f7ea68860b2adb28e6de147181f8c909f2880c68
3
+ size 88000
app/data/{multilingual-e5_cos_escoai/c4b78092-a1fa-41fc-b6b0-8fa36ef29576 → BA_Udemy_Berufe/7611ee46-6912-4fba-9d4f-830c52f852f9}/link_lists.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:95c0583c98e9b4f9d1694015eb8a2bd782fca6f6ad14d7580ba83b1ced231e26
3
- size 51880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0579396dd94f5f59ceedbff20c70ed7651fd81156dc8aeb2f96c1933a2520661
3
+ size 185240
app/data/{multilingual-e5_cos_escoai → BA_Udemy_Berufe}/chroma.sqlite3 RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e5e1bfab026e95b44810b2284b3f82d10871fcd4242aa122e31fa84e27195209
3
- size 103567360
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f750f020317722571b8dc8d1cd72927e7ba6207a84652ef08be31a6ed27cba80
3
+ size 349016064
app/embedding_setup.py CHANGED
@@ -2,8 +2,7 @@ from langchain_community.vectorstores import Chroma
2
  from langchain_community.embeddings import HuggingFaceBgeEmbeddings
3
 
4
  from langchain.docstore.document import Document
5
- from transformers import AutoModelForCausalLM, AutoTokenizer, GenerationConfig,BitsAndBytesConfig
6
- from peft import PeftModel
7
  from config import *
8
  import os
9
  import torch
 
2
  from langchain_community.embeddings import HuggingFaceBgeEmbeddings
3
 
4
  from langchain.docstore.document import Document
5
+ from transformers import AutoTokenizer
 
6
  from config import *
7
  import os
8
  import torch