Spaces:

Project-nlp
/

nlp-bert-team

Sleeping

App Files Community

VerVelVel committed on May 31, 2024

Commit

6a8cbcb

1 Parent(s): cdb0abe

pochti final

Browse files

Files changed (7) hide show

bot/bot.py +1 -1
images/toxity_metrics.png +0 -0
models/model2/__pycache__/model.cpython-310.pyc +0 -0
models/model2/__pycache__/preprocess_text.cpython-310.pyc +0 -0
models/model2/model_weights.pth +0 -3
pages/comments.py +0 -70
pages/policlinic.py +0 -17

bot/bot.py CHANGED Viewed

@@ -29,7 +29,7 @@ start_keyboard = ReplyKeyboardMarkup(
 @lru_cache(maxsize=1)
 def load_model():
     model = BERTClassifier()
-    weights_path = 'bot/model_weights.pth'
+    weights_path = 'bot/model_weights_new.pth'
     state_dict = torch.load(weights_path, map_location=device)
     model.load_state_dict(state_dict)
     model.to(device)

images/toxity_metrics.png DELETED Viewed

Binary file (50.2 kB)

models/model2/__pycache__/model.cpython-310.pyc CHANGED Viewed

Binary files a/models/model2/__pycache__/model.cpython-310.pyc and b/models/model2/__pycache__/model.cpython-310.pyc differ

models/model2/__pycache__/preprocess_text.cpython-310.pyc CHANGED Viewed

Binary files a/models/model2/__pycache__/preprocess_text.cpython-310.pyc and b/models/model2/__pycache__/preprocess_text.cpython-310.pyc differ

models/model2/model_weights.pth DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:0b84f9c8041dd44751288c4777723fb4ff4b3886423f9f6efca37e43c6492429
-size 47712485

pages/comments.py DELETED Viewed

@@ -1,70 +0,0 @@
-import streamlit as st
-import torch
-import sys
-from pathlib import Path
-import requests
-import time
-import cv2
-import numpy as np
-from transformers import AutoTokenizer
-st.write("# Оценка степени токсичности пользовательского сообщения")
-# st.write("Здесь вы можете загрузить картинку со своего устройства, либо при помощи ссылки")
-# Добавление пути к проекту и моделям
-project_root = Path(__file__).resolve().parents[1]
-models_path = project_root / 'models'
-sys.path.append(str(models_path))
-from models.model2.preprocess_text import TextPreprocessorBERT
-from models.model2.model import BERTClassifier
-device = 'cpu'
-# Загрузка модели и словаря
-@st.cache_resource
-def load_model():
-    model = BERTClassifier()
-    weights_path = models_path / 'model2' / 'model_weights_new.pth'
-    state_dict = torch.load(weights_path, map_location=device)
-    model.load_state_dict(state_dict)
-    model.to(device)
-    model.eval()
-    return model
-@st.cache_resource
-def load_tokenizer():
-    return AutoTokenizer.from_pretrained('cointegrated/rubert-tiny-toxicity')
-model = load_model()
-tokenizer = load_tokenizer()
-input_text = st.text_area('Введите текст сообщения')
-if st.button('Предсказать'):
-    # Применяем предобработку
-    preprocessor = TextPreprocessorBERT()
-    preprocessed_text = preprocessor.transform(input_text)
-    # Токенизация
-    tokens = tokenizer.encode_plus(
-        preprocessed_text,
-        add_special_tokens=True,
-        truncation=True,
-        max_length=100,
-        padding='max_length',
-        return_tensors='pt'
-    )
-    # Получаем input_ids и attention_mask из токенов
-    input_ids = tokens['input_ids'].to(device)
-    attention_mask = tokens['attention_mask'].to(device)
-    # Предсказание
-    with torch.no_grad():
-        output = model(input_ids, attention_mask=attention_mask)
-    # Интерпретация результата
-    prediction = torch.sigmoid(output).item()
-    st.write(f'Предсказанный класс токсичности: {prediction:.4f}')

pages/policlinic.py DELETED Viewed

@@ -1,17 +0,0 @@
-import streamlit as st
-import joblib
-import pandas as pd
-from models.model1.Custom_class import TextPreprocessor
-# Load the trained pipeline
-pipeline = joblib.load('models/model1/logistic_regression_pipeline.pkl')
-# Streamlit application
-st.title('Классификация отзывов на русском языке')
-input_text = st.text_area('Введите текст отзыва')
-if st.button('Предсказать'):
-    prediction = pipeline.predict(pd.Series([input_text]))
-    st.write(f'Предсказанный класс с помощью логрег: {prediction[0]}')
-    st.write(f'1 - negative, 0 - positive')