-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathDaturing.py
More file actions
66 lines (46 loc) · 1.83 KB
/
Daturing.py
File metadata and controls
66 lines (46 loc) · 1.83 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
import os
from langchain.chat_models import init_chat_model
from langchain_google_genai import ChatGoogleGenerativeAI
from langchain_core.tools import tool
from langchain_core.prompts import ChatPromptTemplate, MessagesPlaceholder
import json
from IPython.display import display
import ipywidgets as widgets
from typing import Annotated
from typing_extensions import TypedDict
from langgraph.graph import StateGraph, START, END
from langgraph.graph.message import add_messages
import pandas as pd
# Widget para upload do arquivo
upload = widgets.FileUpload(accept='.json', multiple=False)
display(upload)
if not os.environ.get("GOOGLE_API_KEY"):
os.environ["GOOGLE_API_KEY"] = "AIzaSyDPpd_Wed8QgLL29C8TD6jl1kVWGfHzZxo"
llm = init_chat_model("google_genai:gemini-2.0-flash")
def get_dataset_from_upload(upload_widget):
if upload_widget.value:
file_info = list(upload_widget.value.values())[0]
dataset = pd.read_json(file_info['content'])
return dataset
else:
return {}
class State(TypedDict):
user_queries: Annotated[list, add_messages]
ai_messages: Annotated[list, add_messages]
dataset: pd.DataFrame # Dados do .json
generated_code: Annotated[list, add_messages] # Código gerado pela IA
def Node_input(state: State):
# Widget para upload do arquivo
upload = widgets.FileUpload(accept='.json', multiple=False)
display(upload)
state["dataset"] = get_dataset_from_upload(upload)
state["user_queries"].append(input("Digite sua consulta de análise:"))
return state
def limpezaDeDados(state: State):
# Faz uma limpeza nos dados
df = state["dataset"].copy()
temp = (base_de_dados.isnull().sum() / base_de_dados.shape[0]) >= 0.9
variaveis_Faltantes = temp.loc[temp == True].index.tolist()
for v in variaveis_Faltantes:
df = df.drop(v, axis = 1)
return df