-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathai_handler.rb
253 lines (201 loc) · 8.26 KB
/
ai_handler.rb
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
class EmptyVoiceMessageException < StandardError; end
class AiHandler
def initialize
@api_token = BotConfig.config['openai']['token']
return if @api_token.empty?
@recognize_plugins = BotConfig.config['openai']['recognize_plugins']
@personality = File.read(BotConfig.config['openai']['personality_file'])
@plugins_list_prompt_segment = ''
@chat_prompt_history = []
@text_to_command_training = [
{
role: 'system',
content: 'You are a text to command converter, you will only reply with commands given a text by a user and nothing else. I will give you some examples of commands and when a command is not found in these examples, you must reply with UNRECOGNIZED.',
}
]
first_example_plugin_commands = []
Logging.log.info 'Initialized OpenAI client'
@client = OpenAI::Client.new(access_token: @api_token)
if @recognize_plugins
Logging.log.info 'Loading plugins examples for text to command prompt...'
AbsPlugin.descendants.each do |plugin|
plugin_instance = plugin.new
examples_list = plugin_instance.examples
examples_match_commands = examples_list.map { |example| plugin_instance.command.match?(example[:command]) }.all?
if !examples_match_commands
Logging.log.warn "#{plugin_instance.class.name} plugin examples don't match the command!"
end
if !examples_list.empty? && examples_match_commands
first_example_plugin_commands.push(examples_list[0][:command])
@text_to_command_training += examples_list.map do |item|
[
{ role: 'user', content: item[:description] },
{ role: 'assistant', content: item[:command] }
]
end.flatten
end
end
@text_to_command_training += [
{ role: 'user', content: 'Let\'s start a new conversation' }
]
@plugins_list_prompt_segment = "Joshua can also reply just with the following commands: #{first_example_plugin_commands.join(' ')}"
end
end
def ask(bot, user_message, message_text)
return if @api_token.empty?
matched_plugin = false
user_sent_image = false
nested_matched_plugin = false
response_text = ''
chat_prompt_header = <<~PROMPT
You are Joshua a helpful chatbot who enjoys chatting with any human who interacts with him.
#{@personality}#{@plugins_list_prompt_segment.empty? ? '' : "\n#{@plugins_list_prompt_segment}\n"}
PROMPT
.chomp
# if user sends voice message use whisper to transcribe it
# and then use the text for interpreting plugin commands or chatgpt interaction
unless user_message.voice.nil?
file_url = JSON.parse(RestClient.get("https://api.telegram.org/bot#{BotConfig.config['token']}/getFile?file_id=#{user_message.voice.file_id}"))
audio_file_url = "https://api.telegram.org/file/bot#{BotConfig.config['token']}/#{file_url['result']['file_path']}"
local_audio_file = "#{BotConfig.config['temp_directory']}/msg_audio_#{user_message.voice.file_id}"
Logging.log.info 'Downloading voice message and converting to mp3...'
system("wget #{audio_file_url} -O #{local_audio_file}.ogg")
system("ffmpeg -i #{local_audio_file}.ogg -acodec libmp3lame -aq 4 #{local_audio_file}.mp3")
Logging.log.info 'Sending audio file to OpenAI for transcription...'
transcription = transcribe("#{local_audio_file}.mp3")
Logging.log.info "Message transcribed received: \"#{transcription}\""
File.delete("#{local_audio_file}.ogg", "#{local_audio_file}.mp3")
raise EmptyVoiceMessageException if transcription.empty?
message_text = transcription
end
unless user_message.photo.nil?
file_url = JSON.parse(RestClient.get("https://api.telegram.org/bot#{BotConfig.config['token']}/getFile?file_id=#{user_message.photo[-1].file_id}"))
photo_file_url = "https://api.telegram.org/file/bot#{BotConfig.config['token']}/#{file_url['result']['file_path']}"
message_text = []
if user_message.caption.nil?
message_text.push({ type: 'text', text: "What's in this image?" })
else
message_text.push({ type: 'text', text: user_message.caption })
end
message_text.push({
type: 'image_url',
image_url: {
url: photo_file_url
}
})
user_sent_image = true
end
@chat_prompt_history.push(
{
role: 'user',
content: message_text
}
)
if @recognize_plugins && !user_sent_image
user_command_request = @text_to_command_training.clone
user_command_request.push(
{
role: 'user',
content: message_text
}
)
Logging.log.info 'Sending plugin prompt to OpenAI...'
Logging.log.info "Plugin training sent:\n#{user_command_request}" if BotConfig.config['openai']['log_prompts']
bot.api.sendChatAction(chat_id: user_message.chat.id, action: 'typing')
response_text = send_interpret_command(user_command_request)
Logging.log.info "Command received from OpenAI: \"#{response_text}\""
matched_plugin = PluginHandler.handle(bot, user_message, response_text, false)
end
if !matched_plugin || !@recognize_plugins
chat_prompt_system = [
{
role: 'system',
content: chat_prompt_header
}
]
combined_conversation = chat_prompt_system + @chat_prompt_history
Logging.log.info 'Sending chat conversation to OpenAI...'
Logging.log.info "Chat prompt sent:\n#{combined_conversation}" if BotConfig.config['openai']['log_prompts']
bot.api.sendChatAction(chat_id: user_message.chat.id, action: 'typing')
response_text = if user_sent_image
send_chat_image(combined_conversation)
else
send_chat_prompt(combined_conversation)
end
Logging.log.info "Response received: #{response_text}"
if response_text.match?(%r{.*(\/[a-zA-Z]*?)$})
Logging.log.info 'Matched a command in the reply from OpenAI'
possible_command = response_text.match(%r{.*(\/[a-zA-Z]*?)$})
bot.api.send_message(chat_id: user_message.chat.id, text: response_text)
nested_matched_plugin = PluginHandler.handle(bot, user_message, possible_command[1], false)
end
if !nested_matched_plugin
bot.api.send_message(chat_id: user_message.chat.id, text: response_text)
end
end
@chat_prompt_history.push(
{
role: 'assistant',
content: response_text
}
)
# the number two represents a couple of question (user) answer (assistant)
if (@chat_prompt_history.size / 2) > BotConfig.config['openai']['max_interaction_history']
2.times { @chat_prompt_history.shift }
end
rescue EmptyVoiceMessageException
Logging.log.error 'Received empty transcription from OpenAI!'
bot.api.send_message(
chat_id: user_message.chat.id,
text: 'Sorry, not sure I caught that, could you repeat it again? ',
reply_to_message_id: user_message.message_id
)
rescue => e
Logging.log.error "Something went horribly wrong:\n#{e.message}\n#{e.backtrace.join("\n")}"
bot.api.send_message(
chat_id: user_message.chat.id,
text: 'Sorry, feeling a bit dizzy today, could you repeat that again? 😵💫',
reply_to_message_id: user_message.message_id
)
end
private
def transcribe(file_audio_path)
response = @client.audio.transcribe(
parameters: {
model: 'whisper-1',
file: File.open(file_audio_path, 'rb')
}
)
response['text']
end
def send_chat_image(conversation)
response = @client.chat(
parameters: {
model: 'gpt-4o',
messages: conversation,
temperature: 0.5
}
)
response.dig('choices', 0, 'message', 'content')
end
def send_chat_prompt(conversation)
response = @client.chat(
parameters: {
model: 'gpt-4-turbo',
messages: conversation,
temperature: 0.5
}
)
response.dig('choices', 0, 'message', 'content')
end
def send_interpret_command(user_command_request)
response = @client.chat(
parameters: {
model: 'gpt-4',
messages: user_command_request,
temperature: 0
}
)
response.dig('choices', 0, 'message', 'content')
end
end