123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194 |
- # -*- coding:utf-8 -*-
- if __name__ == '__main__':
- import os
- os.chdir("..")
- import requests
- import random
- import json
- import time
- from tools.loglog import logger,simple_logger
- from tools.new_mysql import MySQLUploader
- from typing import Optional, Dict, Any,Union
- import httpx
- import asyncio
- m = MySQLUploader()
- def get_openai_model(model_text:str):
- """模糊获得模型名"""
- if "3.5" in model_text or "3.5-turbo" in model_text or "3.5turbo" in model_text:
- model = "gpt-3.5-turbo"
- elif "4o" in model_text or "gpt4o" in model_text:
- model = "gpt-4o"
- elif "4turbo" in model_text or "4-turbo" in model_text:
- model = "gpt-4-turbo"
- else:
- model = "gpt-4o"
- return model
- def insert_ip_token(ip,demo_name,gpt_content,prompt_tokens,completion_tokens,total_tokens):
- sql = "insert into consumer_token (ip,demo_name,gpt_content,prompt_tokens,completion_tokens,total_tokens) values (%s,%s,%s,%s,%s,%s)"
- m.execute_(sql,(ip,demo_name,str(gpt_content),prompt_tokens,completion_tokens,total_tokens))
- def get_answer_from_gpt(question,real_ip="localhost",demo_name="无",model="gpt-4o",max_tokens=3500,temperature:float=0,
- json_resp:Union[Dict[Any, Any],bool]=False,n=1,check_fucn=None,sys_prompt=None):
- model = get_openai_model(model)
-
- d2 = {"model": model,"messages": [],"max_tokens": max_tokens,"temperature": temperature,'n': n}
- if sys_prompt:
- d2['messages'].append({"role": "system", "content": sys_prompt})
- d2['messages'].append({"role": "user", "content": question})
- if json_resp is True:
- d2["response_format"] = {"type": "json_object"}
- elif json_resp is False:
- pass
- else:
- d2["response_format"] = json_resp
- for num_count in range(3):
- try:
-
- response = requests.post(f'http://170.106.108.95/v1/chat/completions', json=d2)
- r_json = response.json()
- if r2:= r_json.get("choices",None):
- if n>1:
- gpt_res = []
- for i in r2:
- gpt_res.append(i["message"]["content"])
- else:
- gpt_res= r2[0]["message"]["content"]
-
- gpt_content = str(gpt_res)
- prompt_tokens = r_json["usage"]["prompt_tokens"]
- completion_tokens = r_json["usage"]["completion_tokens"]
- total_tokens = r_json["usage"]["total_tokens"]
- insert_ip_token(real_ip,demo_name,gpt_content,prompt_tokens,completion_tokens,total_tokens)
- simple_logger.info(f"问题日志:\n{question}\n回答日志:\n{gpt_res}")
-
- if not check_fucn:
- return gpt_res
-
- check_result = check_fucn(str(gpt_res))
- if check_result:
- return gpt_res
- else:
- raise Exception(f"第{num_count+1}次共3次,GPT的校验没有通过,校验函数:{check_fucn.__name__}")
- elif r_json.get("message") == "IP address blocked":
- print("IP address blocked")
- raise Exception("IP address blocked")
- else:
- print(f"小错误:{question[:10]}")
- logger.error(response.text)
- except Exception as e:
- logger.info(f"小报错忽略{e}")
- time.sleep(10)
- logger.critical("get_answer_from_gpt 严重错误,3次后都失败了")
- async def get_article_gpt_pydantic(question, real_ip="localhost", demo_name="无", model="gpt-4o", max_tokens=3500, temperature:float=0, n=1,
- check_fucn=None, sys_prompt=None, client=None):
- """
- 异步获取文章
- :param question: 问题
- :param real_ip: 真实IP
- :param demo_name: 项目名称
- :param model: 模型名称
- :param max_tokens: 最大token数
- :param temperature: 温度
- :param n: 生成数量
- :param check_fucn: 校验函数
- :param sys_prompt: 系统提示
- :param client: httpx.AsyncClient实例
- :return: 文章内容
- """
-
- d2 = {"model": model, "messages": [], "max_tokens": max_tokens, "temperature": temperature, "response_format":"article"}
- if sys_prompt:
- d2['messages'].append({"role": "system", "content": sys_prompt})
- d2['messages'].append({"role": "user", "content": question})
- for num_count in range(3):
- try:
-
- if client is None:
- async with httpx.AsyncClient() as temp_client:
- response = await temp_client.post('http://170.106.108.95/get_article', json=d2)
- else:
- response = await client.post('http://170.106.108.95/get_article', json=d2)
-
- r_str = response.json()
- simple_logger.info(f"问题日志:\n{question}\n回答日志:\n{r_str}")
-
- if not check_fucn:
- return r_str
-
- check_result = check_fucn(r_str)
- if check_result:
- return r_str
- else:
- raise Exception(f"第{num_count + 1}次共3次,GPT的校验没有通过,校验函数:{check_fucn.__name__}")
- except httpx.HTTPError as e:
- logger.error(f"HTTP请求错误: {str(e)}")
- if num_count < 2:
- await asyncio.sleep(10)
- else:
- raise
- except Exception as e:
- logger.error(f"其他错误: {str(e)}")
- if num_count < 2:
- await asyncio.sleep(10)
- else:
- raise
- logger.critical("get_article_gpt_pydantic 严重错误,3次后都失败了")
- raise Exception("获取文章失败,已达到最大重试次数")
- def parse_gpt_phon_to_tuplelist(text:str) -> list:
- """解析gpt返回的音标数据"""
- result = []
- if not text:
- return []
- for i in text.split("\n"):
- ii = i.split("***")
- if len(ii)>=3:
- result.append((ii[0].strip(),ii[1].strip(),ii[2].strip()))
- return result
- if __name__ == '__main__':
- question = "hello"
-
- sys_prompt = "你是一个专业的英语老师,擅长根据用户提供的词汇生成对应的英语文章和中文翻译和4个配套选择题。"
- q= """下面我会为你提供两组数据,[单词组1]和[单词组2](里面包含词义id,英语单词,中文词义),优先使用[单词组1]内的单词,请根据这些单词的中文词义,生成一篇带中文翻译的考场英语文章,英语文章和中文翻译要有[标题]。注意这个单词有多个词义时,生成的英语文章一定要用提供的中文词义。并挑选一句复杂的句子和其中文翻译,放入difficultSentences。英语文章,放入"englishArticle"中。中文翻译,放入"chineseArticle"中。最终文中使用到的单词id放入"usedMeanIds"中。4个选择题,放入questions字段。questions结构下有4个选择题对象,其中trunk是[英语]问题文本,analysis是[中文]的问题分析,candidates是4个ABCD选项,内部有label是指选项序号A B C D ,text是[英语]选项文本,isRight是否正确答案1是正确0是错误。
- 要求:
- 1.必须用提供的这个词义的单词,其他单词使用常见、高中难度的的单词。文章整体难度适中,大约和中国的高中生,中国CET-6,雅思6分这样的难度标准。
- 2.优先保证文章语句通顺,意思不要太生硬。不要为了使用特定的单词,造成文章语义前后不搭,允许不使用个别词义。
- 3.文章中使用提供单词,一定要和提供单词的中文词义匹配,尤其是一词多义时,务必使用提供单词的词义。必须要用提供单词的词义。如果用到的词义与提供单词词义不一致,请不要使用这个单词。
- 4.生成的文章要求600词左右,可以用\\n\\n字符分段,一般5个段落左右。第一段是文章标题。
- 5.生成文章优先使用[单词组1]的词义,其次可以挑选使用[单词组2]的词义。允许不使用[单词组1]的个别单词,优先保证文章整体意思通顺连贯和故事完整。
- 提供[单词组1]:4238 penalty:惩罚, 刑罚;4591 bare:赤裸的, 无遮蔽的;4227 stable:畜舍, 马厩;4236 psychology:心理学;4245 offense:进攻, 攻势, 冒犯, 触怒, 过错;4237 innocent:清白的, 无辜的, 天真的;4228 refrigerator:冰箱, 冷库;4247 tissue:(动植物)组织;4250 awareness:察觉, 觉悟, 意识;4234 mode:方式, 模式;4224 neat:整洁, 利索;4225 statistics:统计;4251 random:任意的, 随机的;4201 laundry:洗衣房;4545 barrel:桶, 一桶之量;4249 recruit:招募, 新成员;4229 pregnant:怀孕的, 孕育的;4235 relevant:有关的, 相关联的;4252 incentive:刺激, 激励, 鼓励;4194 grave:坟墓, 墓穴;
- 提供[单词组2]:;
- """
- resp = get_article_gpt_pydantic(question=q,temperature=0.9,sys_prompt=sys_prompt,model="gpt-4.1")
- print(type(resp))
- print(resp)
|