Intents.JSON mit Umlaute zeigt nicht richtig in Python
Verfasst: Dienstag 14. September 2021, 19:24
data_file = open('intents.json').read()
intents = json.loads(data_file)
Intents hat deutsche Umlaute und diese werden in meinem Chatbot nicht korrekt angezeigt.
Ich Danke für die Hilfe.
Code
#!/usr/bin/python
# -*- coding: utf-8 -*-
import nltk
from nltk.stem import WordNetLemmatizer
lemmatizer = WordNetLemmatizer()
import pickle
import numpy as np
from tensorflow.keras.models import load_model
import json
import random
data_file = open('intents.json').read()
intents = json.load(data_file)
words = pickle.load(open('words.pkl','rb'))
classes = pickle.load(open('classes.pkl','rb'))
model = load_model('chatbot_model.h5')
def clean_up_sentence(sentence):
# tokenize the pattern - split words into array
sentence_words = nltk.word_tokenize(sentence)
# stem each word - create short form for word
sentence_words = [lemmatizer.lemmatize(word.lower()) for word in sentence_words]
return sentence_words
# return bag of words array: 0 or 1 for each word in the bag that exists in the sentence
def bow(sentence, words, show_details=True):
# tokenize the pattern
sentence_words = clean_up_sentence(sentence)
# bag of words - matrix of N words, vocabulary matrix
bag = [0]*len(words)
for s in sentence_words:
for i,w in enumerate(words):
if w == s:
# assign 1 if current word is in the vocabulary position
bag = 1
if show_details:
print ("found in bag: %s" % w)
return(np.array(bag))
def predict_class(sentence, model):
# filter out predictions below a threshold
p = bow(sentence, words,show_details=False)
res = model.predict(np.array([p]))[0]
ERROR_THRESHOLD = 0.25
results = [[i,r] for i,r in enumerate(res) if r>ERROR_THRESHOLD]
# sort by strength of probability
results.sort(key=lambda x: x[1], reverse=True)
return_list = []
for r in results:
return_list.append({"intent": classes[r[0]], "probability": str(r[1])})
return return_list
def getResponse(ints, intents_json):
tag = ints[0]['intent']
list_of_intents = intents_json['intents']
for i in list_of_intents:
if(i['tag']== tag):
result = random.choice(i['responses'])
break
return result
def chatbot_response(msg):
ints = predict_class(msg, model)
res = getResponse(ints, intents)
return res
#Creating GUI with tkinter
import tkinter
from tkinter import *
from PIL import Image, ImageTk
def send():
msg = EntryBox.get("1.0",'end-1c').strip()
EntryBox.delete("0.0",END)
if msg != '':
ChatLog.config(state=NORMAL)
ChatLog.insert(END, "You: " + msg + '\n\n')
ChatLog.config(foreground="#442265", font=("Verdana", 12 ))
res = chatbot_response(msg)
ChatLog.insert(END, "Bot: " + res + '\n\n')
ChatLog.config(state=DISABLED)
ChatLog.yview(END)
base = tkinter.Tk()
base.title("Borat")
base.geometry("400x500")
base.resizable(width=TRUE, height=TRUE)
#Create Chat window
ChatLog = Text(base, bd=0, bg="white",font="Arial")
ChatLog.config(state=DISABLED)
ChatLog.pack(side="right", fill="y", expand=True, padx=5, pady=5)
#Bind scrollbar to Chat window
scrollbar = Scrollbar(base, command=ChatLog.yview, cursor="heart")
ChatLog['yscrollcommand'] = scrollbar.set
image = Image.open(r"C:\Users\pavilion\Desktop\ChatBot\mail.png")
resize_image = image.resize((68,65))
img = ImageTk.PhotoImage(resize_image)
#Create Button to send message
SendButton = tkinter.Button(base, image=img, cursor="dot",
relief=FLAT, command= send)
##font=("Arial",12,'bold'), text="send", width="10", height=2, highlightcolor="#e1c4c5", bg="#32de97", activebackground="#3c9d9b",fg='#ffffff',##
#Create the box to enter message
EntryBox = Text(base, bd=0, bg="white", font="Arial")
EntryBox.bind('<Return>', send)
EntryBox.pack(side="top", fill="both", expand=True, padx=0, pady=0)
#Place all components on the screen
ChatLog.place(x=6,y=6, height=386, width=370)
EntryBox.place(x=80, y=401, height=90, width=265)
scrollbar.place(x=376,y=6, height=386)
SendButton.place(x=5, y=410, height=71, width=70)
base.mainloop()
intents = json.loads(data_file)
Intents hat deutsche Umlaute und diese werden in meinem Chatbot nicht korrekt angezeigt.
Ich Danke für die Hilfe.
Code
#!/usr/bin/python
# -*- coding: utf-8 -*-
import nltk
from nltk.stem import WordNetLemmatizer
lemmatizer = WordNetLemmatizer()
import pickle
import numpy as np
from tensorflow.keras.models import load_model
import json
import random
data_file = open('intents.json').read()
intents = json.load(data_file)
words = pickle.load(open('words.pkl','rb'))
classes = pickle.load(open('classes.pkl','rb'))
model = load_model('chatbot_model.h5')
def clean_up_sentence(sentence):
# tokenize the pattern - split words into array
sentence_words = nltk.word_tokenize(sentence)
# stem each word - create short form for word
sentence_words = [lemmatizer.lemmatize(word.lower()) for word in sentence_words]
return sentence_words
# return bag of words array: 0 or 1 for each word in the bag that exists in the sentence
def bow(sentence, words, show_details=True):
# tokenize the pattern
sentence_words = clean_up_sentence(sentence)
# bag of words - matrix of N words, vocabulary matrix
bag = [0]*len(words)
for s in sentence_words:
for i,w in enumerate(words):
if w == s:
# assign 1 if current word is in the vocabulary position
bag = 1
if show_details:
print ("found in bag: %s" % w)
return(np.array(bag))
def predict_class(sentence, model):
# filter out predictions below a threshold
p = bow(sentence, words,show_details=False)
res = model.predict(np.array([p]))[0]
ERROR_THRESHOLD = 0.25
results = [[i,r] for i,r in enumerate(res) if r>ERROR_THRESHOLD]
# sort by strength of probability
results.sort(key=lambda x: x[1], reverse=True)
return_list = []
for r in results:
return_list.append({"intent": classes[r[0]], "probability": str(r[1])})
return return_list
def getResponse(ints, intents_json):
tag = ints[0]['intent']
list_of_intents = intents_json['intents']
for i in list_of_intents:
if(i['tag']== tag):
result = random.choice(i['responses'])
break
return result
def chatbot_response(msg):
ints = predict_class(msg, model)
res = getResponse(ints, intents)
return res
#Creating GUI with tkinter
import tkinter
from tkinter import *
from PIL import Image, ImageTk
def send():
msg = EntryBox.get("1.0",'end-1c').strip()
EntryBox.delete("0.0",END)
if msg != '':
ChatLog.config(state=NORMAL)
ChatLog.insert(END, "You: " + msg + '\n\n')
ChatLog.config(foreground="#442265", font=("Verdana", 12 ))
res = chatbot_response(msg)
ChatLog.insert(END, "Bot: " + res + '\n\n')
ChatLog.config(state=DISABLED)
ChatLog.yview(END)
base = tkinter.Tk()
base.title("Borat")
base.geometry("400x500")
base.resizable(width=TRUE, height=TRUE)
#Create Chat window
ChatLog = Text(base, bd=0, bg="white",font="Arial")
ChatLog.config(state=DISABLED)
ChatLog.pack(side="right", fill="y", expand=True, padx=5, pady=5)
#Bind scrollbar to Chat window
scrollbar = Scrollbar(base, command=ChatLog.yview, cursor="heart")
ChatLog['yscrollcommand'] = scrollbar.set
image = Image.open(r"C:\Users\pavilion\Desktop\ChatBot\mail.png")
resize_image = image.resize((68,65))
img = ImageTk.PhotoImage(resize_image)
#Create Button to send message
SendButton = tkinter.Button(base, image=img, cursor="dot",
relief=FLAT, command= send)
##font=("Arial",12,'bold'), text="send", width="10", height=2, highlightcolor="#e1c4c5", bg="#32de97", activebackground="#3c9d9b",fg='#ffffff',##
#Create the box to enter message
EntryBox = Text(base, bd=0, bg="white", font="Arial")
EntryBox.bind('<Return>', send)
EntryBox.pack(side="top", fill="both", expand=True, padx=0, pady=0)
#Place all components on the screen
ChatLog.place(x=6,y=6, height=386, width=370)
EntryBox.place(x=80, y=401, height=90, width=265)
scrollbar.place(x=376,y=6, height=386)
SendButton.place(x=5, y=410, height=71, width=70)
base.mainloop()