4 月之前 · ea9d15c655
--- a/README.rst
+++ b/README.rst
@@ -0,0 +1,8 @@
 
															+# diviner 先知控制器
														
 
															+
														
 
															+安装
														
 
															+
														
 
															+python install.py
														
 
															+
														
 
															+前台：python front.py
														
 
															+后台：python admin.py
														
--- a/admin.py
+++ b/admin.py
@@ -0,0 +1,10 @@
 
															+#!/usr/bin/env python
														
 
															+# -*- coding: utf-8 -*-
														
 
															+"""
														
 
															+    demeter web
														
 
															+    name:admin.py
														
 
															+"""
														
 
															+from demeter.core import *
														
 
															+
														
 
															+if __name__ == "__main__":
														
 
															+	Demeter.webInit('admin')
														
--- a/admin/__init__.py
+++ b/admin/__init__.py
@@ -0,0 +1 @@
 
															+# -*- coding: utf-8 -*-
														
--- a/admin/main.py
+++ b/admin/main.py
@@ -0,0 +1,5 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from demeter.web import *
														
 
															+import demeter.admin.page as admin_page
														
 
															+import admin.page
														
 
															+Web.start(application=[admin.page,admin_page])
														
--- a/admin/page/__init__.py
+++ b/admin/page/__init__.py
@@ -0,0 +1 @@
 
															+# -*- coding: utf-8 -*-
														
--- a/admin/page/__load__.py
+++ b/admin/page/__load__.py
@@ -0,0 +1,2 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from demeter.admin.page.__load__ import *
														
--- a/admin/page/lang_model.py
+++ b/admin/page/lang_model.py
@@ -0,0 +1,55 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from .__load__ import *
														
 
															+
														
 
															+class lang_model_path(Load):
														
 
															+	@Web.auth
														
 
															+	@Web.setting
														
 
															+	def get(self):
														
 
															+		self.set(
														
 
															+			name = u'语言模型'
														
 
															+			,path = '/lang_model/lang_model'
														
 
															+			,width = '600'
														
 
															+			,height = '600'
														
 
															+			,search = (('label-1','cdate-time-start','cdate-time-end','name-input-mlike'), (u'日期范围',u'开始时间',u'截止时间',u'模型名称'))
														
 
															+			,thead = (u'模型名称', u'模型渠道', u'模型标识', u'创建时间')
														
 
															+			,tbody = ('name', 'channel', 'model', 'time')
														
 
															+			,state = True
														
 
															+		)
														
 
															+		self.list('lang_model')
														
 
															+		if self.data['list']:
														
 
															+			llm = Demeter.config['llm']
														
 
															+			for key, value in enumerate(self.data['list']):
														
 
															+				id = str(value['id'])
														
 
															+				self.data['list'][key]['time'] = Demeter.date(value['cdate'])
														
 
															+				self.data['list'][key]['channel'] = llm[value['channel']]
														
 
															+		self.show('list')
														
 
															+
														
 
															+class lang_model_update_path(Load):
														
 
															+	@Web.auth
														
 
															+	@Web.setting
														
 
															+	def get(self):
														
 
															+		llm = Demeter.config['llm']
														
 
															+		channel = []
														
 
															+		for key, value in llm.items():
														
 
															+			channel.append({'id':key, 'name':value})
														
 
															+		status = [
														
 
															+			{'id':'1', 'name': '正常'},
														
 
															+			{'id':'2', 'name': '封禁'},
														
 
															+		]
														
 
															+		self.set(
														
 
															+			path = '/lang_model/lang_model'
														
 
															+			,label = (u'模型名称',u'模型渠道',u'模型标识')
														
 
															+			,update = ('name-input-required','channel-select-required','model-input-required')
														
 
															+			,update_channel = channel
														
 
															+			#,update_status = status
														
 
															+		)
														
 
															+		self.one('lang_model')
														
 
															+		self.show('update')
														
 
															+	@Web.auth
														
 
															+	@Web.setting
														
 
															+	def post(self):
														
 
															+		self.update('lang_model')
														
 
															+	@Web.auth
														
 
															+	@Web.setting
														
 
															+	def delete(self):
														
 
															+		self.drop('lang_model')
														
--- a/admin/page/role.py
+++ b/admin/page/role.py
@@ -0,0 +1,77 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+"""
														
 
															+    demeter web page
														
 
															+    name:site.py 站点相关
														
 
															+    author:rabin
														
 
															+"""
														
 
															+from .__load__ import *
														
 
															+
														
 
															+class role_path(Load):
														
 
															+	@Web.auth
														
 
															+	@Web.setting
														
 
															+	def get(self):
														
 
															+		self.set(
														
 
															+			name = u'角色列表'
														
 
															+			,path = '/role/role'
														
 
															+			,width = '600'
														
 
															+			,height = '600'
														
 
															+			,edit = True
														
 
															+			,add = True
														
 
															+			,search = (('label-1','cdate-time-start','cdate-time-end','site_id-select-','status-select-','name-input-mlike'), (u'日期范围',u'开始时间',u'截止时间',u'选择站点',u'选择状态',u'角色名称'))
														
 
															+			,thead = (u'角色ID', u'角色名称', u'模型名称', u'使用次数', u'角色状态', u'创建时间')
														
 
															+			,tbody = ('id','name', 'model','use_num', 'status', 'cdate')
														
 
															+			,state = True
														
 
															+		)
														
 
															+		self.data['common']['search_site_id-select-'] = self.service('common').list('site')
														
 
															+		self.data['common']['search_status-select-'] = [{'id':1,'value':1,'name':u'正常'},{'id':2,'value':2, 'name':u'封禁'}]
														
 
															+
														
 
															+		self.list('role')
														
 
															+		status = {}
														
 
															+		status[1] = '正常'
														
 
															+		status[2] = '封禁'
														
 
															+		if self.data['list']:
														
 
															+			for key, value in enumerate(self.data['list']):
														
 
															+				site = self.service('common').one('site', id=value['site_id'])
														
 
															+				self.data['list'][key]['site'] = site['name']
														
 
															+				lang_model = self.service('common').one('lang_model', id=value['lang_model_id'])
														
 
															+				self.data['list'][key]['model'] = lang_model['name']
														
 
															+				self.data['list'][key]['status'] = status[value['status']]
														
 
															+
														
 
															+		self.show('list')
														
 
															+
														
 
															+class role_update_path(Load):
														
 
															+	@Web.auth
														
 
															+	@Web.setting
														
 
															+	def get(self):
														
 
															+		status = [
														
 
															+			{'id':'1', 'name': '正常'},
														
 
															+			{'id':'2', 'name': '封禁'},
														
 
															+		]
														
 
															+		self.set(
														
 
															+			path = '/role/role'
														
 
															+			,label = (u'所属站点', u'角色名称', u'语言模型', u'人设')
														
 
															+			,update = ('site_id-select-required', 'name-input-required', 'lang_model_id-select-', 'persona-text-required')
														
 
															+			,update_lang_model_id = self.service('common').list('lang_model')
														
 
															+			,update_site_id = self.service('common').list('site')
														
 
															+			#,update_status = status
														
 
															+		)
														
 
															+		self.one('role')
														
 
															+		self.show('update')
														
 
															+	@Web.auth
														
 
															+	@Web.setting
														
 
															+	def post(self):
														
 
															+		self.data['update']['create_uid'] = -1
														
 
															+		self.data['update']['owner_uid'] = -1
														
 
															+
														
 
															+		sid = self.update('role')
														
 
															+
														
 
															+		'''
														
 
															+		if sid:
														
 
															+			redis = Demeter.redis()
														
 
															+			config = Demeter.config['redis']
														
 
															+			redis.rpush(config['name'], sid)
														
 
															+		'''
														
 
															+	@Web.auth
														
 
															+	@Web.setting
														
 
															+	def delete(self):
														
 
															+		self.drop('role')
														
--- a/admin/page/site.py
+++ b/admin/page/site.py
@@ -0,0 +1,75 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+"""
														
 
															+    demeter web page
														
 
															+    name:site.py 站点相关
														
 
															+    author:rabin
														
 
															+"""
														
 
															+from .__load__ import *
														
 
															+
														
 
															+class site_path(Load):
														
 
															+	@Web.auth
														
 
															+	@Web.setting
														
 
															+	def get(self):
														
 
															+		self.set(
														
 
															+			name = u'站点管理'
														
 
															+			,path = '/site/site'
														
 
															+			,width = '600'
														
 
															+			,height = '600'
														
 
															+			,search = (('label-1','workdate-time-start','workdate-time-end','name-input-mlike'), (u'日期范围',u'开始时间',u'截止时间',u'站点名称'))
														
 
															+			,thead = (u'站点名称', u'快捷功能', u'授权信息', u'授权时间')
														
 
															+			,tbody = ('name', 'func', 'app', 'time')
														
 
															+			,state = True
														
 
															+		)
														
 
															+		menu = (
														
 
															+			{'name':'角色列表', 'url':'/role/role'},
														
 
															+		)
														
 
															+		self.list('site')
														
 
															+		if self.data['list']:
														
 
															+			for key, value in enumerate(self.data['list']):
														
 
															+				id = str(value['id'])
														
 
															+				self.data['list'][key]['time'] = Demeter.date(value['sdate']) + ' 至 ' + Demeter.date(value['edate'])
														
 
															+				self.data['list'][key]['app'] = u'[appid]：' + value['appid'] + u'<br />[appsecret]：' + value['appsecret']
														
 
															+				param = '?search_site_id-select-=' + id
														
 
															+				self.data['list'][key]['func'] = ''
														
 
															+				for i in menu:
														
 
															+					self.data['list'][key]['func'] = self.data['list'][key]['func'] + '<a href="'+i['url']+''+param+'">'+i['name']+'</a>&nbsp;&nbsp;&nbsp;&nbsp;'
														
 
															+		self.show('list')
														
 
															+
														
 
															+class site_update_path(Load):
														
 
															+	@Web.auth
														
 
															+	@Web.setting
														
 
															+	def get(self):
														
 
															+		self.set(
														
 
															+			path = '/site/site'
														
 
															+			,label = (u'站点名称',u'站点网址',u'通知接口',u'开始时间', u'结束时间')
														
 
															+			,update = ('name-input-required','link-input-required','api-input-required','sdate-date-required','edate-date-required')
														
 
															+		)
														
 
															+		self.one('site')
														
 
															+		self.show('update')
														
 
															+	@Web.auth
														
 
															+	@Web.setting
														
 
															+	def post(self):
														
 
															+		id = self.input('id')
														
 
															+		if not id:
														
 
															+			self.getAppId()
														
 
															+		else:
														
 
															+			info = self.service('common').one('site', id=id)
														
 
															+			if not info['appid'] or not info['appsecret']:
														
 
															+				self.getAppId()
														
 
															+		self.update('site')
														
 
															+	@Web.auth
														
 
															+	@Web.setting
														
 
															+	def delete(self):
														
 
															+		self.drop('site')
														
 
															+	@Web.auth
														
 
															+	@Web.setting
														
 
															+	def getAppId(self):
														
 
															+		self.data['update']['appid'] = Demeter.compressUuid(Demeter.uuid('convert'))
														
 
															+		self.data['update']['appsecret'] = Demeter.hash()
														
 
															+
														
 
															+		model = Demeter.model('site')
														
 
															+		model.appid = self.data['update']['appid']
														
 
															+		model.appsecret = self.data['update']['appsecret']
														
 
															+		info = model.select(type='fetchone')
														
 
															+		if info:
														
 
															+			self.getAppId()
														
--- a/check.py
+++ b/check.py
@@ -0,0 +1,23 @@
 
															+#!/usr/bin/env python
														
 
															+# -*- coding: utf-8 -*-
														
 
															+import time
														
 
															+import os
														
 
															+timeSleep = 15
														
 
															+
														
 
															+def popen(command, bg=False):
														
 
															+        string = command
														
 
															+        if bg == True:
														
 
															+                command = command + ' &'
														
 
															+        process = os.popen(command)
														
 
															+        output = process.read()
														
 
															+        process.close()
														
 
															+        return output
														
 
															+
														
 
															+def process():
														
 
															+        command = 'python /data/dm/container/web/master_cron.py 1>/dev/null 2>&1 &'
														
 
															+        check = 'ps -ef | grep master_cron.py | grep -v grep | wc -l'
														
 
															+        value = int(popen(check))
														
 
															+        if value == 0:
														
 
															+                popen(command)
														
 
															+
														
 
															+process()
														
--- a/conf/dev.conf
+++ b/conf/dev.conf
@@ -0,0 +1,96 @@
 
															+[base]
														
 
															+;开发环境配置
														
 
															+[setting]
														
 
															+name				= 先知控制器
														
 
															+site				= http://diviner.shemic.com/doc/
														
 
															+copyright			= 2025 shemic.com v1.0.0
														
 
															+
														
 
															+;打印路由表
														
 
															+route				= True
														
 
															+
														
 
															+[db]
														
 
															+rdb					= sqlite
														
 
															+
														
 
															+[sqlite]
														
 
															+file                = diviner
														
 
															+;允许自动建表
														
 
															+create              = True
														
 
															+
														
 
															+[mysql]
														
 
															+host				= 0.0.0.0
														
 
															+port				= 3306
														
 
															+username			= root
														
 
															+password			= 123456
														
 
															+dbname				= diviner
														
 
															+prefix				= oc
														
 
															+charset				= utf8
														
 
															+;允许自动建表
														
 
															+create				= True
														
 
															+
														
 
															+[redis]
														
 
															+host				= 127.0.0.1
														
 
															+password			= dm_redis_123
														
 
															+port				= 6379
														
 
															+name				= diviner
														
 
															+prefix				= shemic_
														
 
															+
														
 
															+;定义一些tornado的配置，可为空
														
 
															+[tornado]
														
 
															+
														
 
															+;后台配置
														
 
															+[admin]
														
 
															+port				= 8087
														
 
															+debug				= True
														
 
															+;请求的buffersize
														
 
															+max_buffer_size		= 210763776
														
 
															+;子进程
														
 
															+process				= 0
														
 
															+;定义后台父级菜单
														
 
															+menu_parent			= 站点设置:&#xe62e;
														
 
															+;定义后台子级菜单
														
 
															+menu_child			= 站点管理:/site/site,语言模型:/lang_model/lang_model
														
 
															+
														
 
															+;cookie
														
 
															+cookie_secret       = 61oETzKXQAGaYekL5gEmGeJJFuYh7EQnp2XdTP1o/Vo=
														
 
															+login_url           = /user/login
														
 
															+;是否使用安全cookie
														
 
															+xsrf_cookies        = True
														
 
															+
														
 
															+;前台配置
														
 
															+[front]
														
 
															+port				= 8089
														
 
															+debug				= True
														
 
															+;请求的buffersize
														
 
															+max_buffer_size		= 210763776
														
 
															+;子进程
														
 
															+process				= 0
														
 
															+;支持手机版
														
 
															+mobile				= True
														
 
															+
														
 
															+;llm大模型配置
														
 
															+[llm]
														
 
															+dp                  = deepseek
														
 
															+baidu               = 文心一言
														
 
															+ali                 = 阿里
														
 
															+moonshot            = 月之暗面
														
 
															+zhipu               = 智普AI
														
 
															+spark               = 讯飞星火
														
 
															+[baidu]
														
 
															+QIANFAN_AK               = hhpP53ks4dbiCaOjYIWABRFd
														
 
															+QIANFAN_SK               = xhXgsFZCQQ4xTqOuYey4Qpp3FBm2Iunx
														
 
															+[dp]
														
 
															+api_key = 1111
														
 
															+[ali]
														
 
															+api_key = sk-4d894d18ec194c498b8fc7e1a741b7ea
														
 
															+base_url = https://dashscope.aliyuncs.com/compatible-mode/v1
														
 
															+[moonshot]
														
 
															+api_key = 1111
														
 
															+[zhipu]
														
 
															+api_key = 111
														
 
															+[spark]
														
 
															+api_key = 111
														
 
															+
														
 
															+[baiduocr]
														
 
															+app_id = 11141139
														
 
															+api_key = zaOaRKxp7tH977WPHEkv1YGy
														
 
															+secret_key = gtNP7AIS93YXyYnAv93f6oHkqvcxxAH6
														
--- a/conf/env.conf
+++ b/conf/env.conf
@@ -0,0 +1,68 @@
 
															+[base]
														
 
															+;线上环境配置，请设置环境变量DEMETER_CONF = env
														
 
															+[setting]
														
 
															+name                = 先知控制器
														
 
															+site                = http://diviner.shemic.com/doc/
														
 
															+copyright           = 2024 shemic.com v1.0.0
														
 
															+
														
 
															+;文档转换后 保存的路径 一般用于nginx使用 默认保存到runtime
														
 
															+;save				= /share/files/
														
 
															+
														
 
															+[db]
														
 
															+rdb                 = sqlite
														
 
															+
														
 
															+[sqlite]
														
 
															+file                = diviner
														
 
															+;允许自动建表
														
 
															+create              = True
														
 
															+
														
 
															+[mysql]
														
 
															+host				= web-mysql
														
 
															+port				= 3306
														
 
															+username			= root
														
 
															+password			= 123456
														
 
															+dbname				= diviner
														
 
															+prefix				= oc
														
 
															+charset				= utf8
														
 
															+;允许自动建表
														
 
															+create				= True
														
 
															+
														
 
															+[redis]
														
 
															+host				= web-redis
														
 
															+password			= dm_redis_123
														
 
															+port				= 6379
														
 
															+name				= diviner
														
 
															+prefix				= shemic_
														
 
															+
														
 
															+;定义一些tornado的配置，可为空
														
 
															+[tornado]
														
 
															+
														
 
															+;后台配置
														
 
															+[admin]
														
 
															+port				= 8087
														
 
															+debug				= False
														
 
															+;请求的buffersize
														
 
															+max_buffer_size		= 210763776
														
 
															+;子进程
														
 
															+process				= 0
														
 
															+;定义后台父级菜单
														
 
															+menu_parent			= 站点设置:&#xe62e;
														
 
															+;定义后台子级菜单
														
 
															+menu_child			= 站点管理:/site/site,转换文件列表:/site/convert
														
 
															+
														
 
															+;cookie
														
 
															+cookie_secret		= 61oETzKXQAGaYekL5gEmGeJJFuYh7EQnp2XdTP1o/Vo=
														
 
															+login_url			= /user/login
														
 
															+;是否使用安全cookie
														
 
															+xsrf_cookies		= True
														
 
															+
														
 
															+;前台配置
														
 
															+[front]
														
 
															+port				= 8088
														
 
															+debug				= False
														
 
															+;请求的buffersize
														
 
															+max_buffer_size		= 210763776
														
 
															+;子进程
														
 
															+process				= 30
														
 
															+;支持手机版
														
 
															+mobile				= True
														
--- a/cron.py
+++ b/cron.py
@@ -0,0 +1,3 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from demeter.core import *
														
 
															+Demeter.service('loader').start()
														
--- a/data/04、Frog
+++ b/data/04、Frog
--- a/Hungry/page10_img_0.png
+++ b/Hungry/page10_img_0.png
--- a/Hungry/page11_img_0.png
+++ b/Hungry/page11_img_0.png
--- a/Hungry/page12_img_0.png
+++ b/Hungry/page12_img_0.png
--- a/Hungry/page16_img_4.png
+++ b/Hungry/page16_img_4.png
--- a/Hungry/page1_img_3.png
+++ b/Hungry/page1_img_3.png
--- a/Hungry/page2_img_1.png
+++ b/Hungry/page2_img_1.png
--- a/Hungry/page3_img_0.png
+++ b/Hungry/page3_img_0.png
--- a/Hungry/page4_img_0.png
+++ b/Hungry/page4_img_0.png
--- a/Hungry/page5_img_0.png
+++ b/Hungry/page5_img_0.png
--- a/Hungry/page6_img_0.png
+++ b/Hungry/page6_img_0.png
--- a/Hungry/page7_img_0.png
+++ b/Hungry/page7_img_0.png
--- a/Hungry/page8_img_0.png
+++ b/Hungry/page8_img_0.png
--- a/Hungry/page9_img_0.png
+++ b/Hungry/page9_img_0.png
--- a/data/24、Extreme
+++ b/data/24、Extreme
--- a/data/76、
+++ b/data/76、
--- a/diviner
+++ b/diviner
--- a/front.py
+++ b/front.py
@@ -0,0 +1,10 @@
 
															+#!/usr/bin/env python
														
 
															+# -*- coding: utf-8 -*-
														
 
															+"""
														
 
															+    demeter web
														
 
															+    name:front.py
														
 
															+"""
														
 
															+from demeter.core import *
														
 
															+
														
 
															+if __name__ == "__main__":
														
 
															+	Demeter.webInit('front')
														
--- a/front/__init__.py
+++ b/front/__init__.py
@@ -0,0 +1 @@
 
															+# -*- coding: utf-8 -*-
														
--- a/front/api/__init__.py
+++ b/front/api/__init__.py
@@ -0,0 +1 @@
 
															+# -*- coding: utf-8 -*-
														
--- a/front/api/__load__.py
+++ b/front/api/__load__.py
@@ -0,0 +1,4 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from demeter.web import *
														
 
															+
														
 
															+#可以在此定义一些核心类库
														
--- a/front/api/main.py
+++ b/front/api/main.py
@@ -0,0 +1,24 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from .__load__ import *
														
 
															+
														
 
															+# 请求处理 /main/loader 接口必须后端获取，token不允许暴露
														
 
															+#http://192.168.33.10:8088/main/loader?signature=44e3cd684a9fe697792a235c8c57838211f5823a&appid=mo1209&nonce=1529659172&method=extract&site_id=1&uid=1&source_id=1&source=
														
 
															+class loader_path(Base):
														
 
															+	@Web.setting
														
 
															+	def get(self):
														
 
															+		# 这里定义开放的功能
														
 
															+		config = {
														
 
															+			'extract': ['parser', 'extract']
														
 
															+		}
														
 
															+		method = self.input('method')
														
 
															+		param = self.request.arguments
														
 
															+		if method in config:
														
 
															+			site = Demeter.service('auth').init(param)
														
 
															+			if isinstance(site, str):
														
 
															+				self.out('no', site)
														
 
															+			else:
														
 
															+				method = config[method]
														
 
															+				param['sync'] = False
														
 
															+				Demeter.service('loader').get(obj=method[0], module=method[1], **param)
														
 
															+		else:
														
 
															+			self.out('no', 'method error')
														
--- a/front/main.py
+++ b/front/main.py
@@ -0,0 +1,4 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from demeter.web import *
														
 
															+import front.api
														
 
															+Web.start(application=[front.api])
														
--- a/install.py
+++ b/install.py
@@ -0,0 +1,25 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from demeter.core import *
														
 
															+
														
 
															+#CREATE DATABASE IF NOT EXISTS yourdbname DEFAULT CHARSET utf8 COLLATE utf8_general_ci;
														
 
															+def manage():
														
 
															+	model = Demeter.model('manage_admin')
														
 
															+	model.id = 1
														
 
															+	info = model.select(type='fetchone')
														
 
															+	if not info:
														
 
															+		model.role_id = 1
														
 
															+		model.username = 'admin'
														
 
															+		model.mobile = '15810090845'
														
 
															+		model.password = '123456'
														
 
															+		model.insert()
														
 
															+
														
 
															+	model = Demeter.model('manage_role')
														
 
															+	model.id = 1
														
 
															+	info = model.select(type='fetchone')
														
 
															+	if not info:
														
 
															+		model.name = u'管理员'
														
 
															+		model.insert()
														
 
															+
														
 
															+manage()
														
 
															+
														
 
															+Demeter.echo('install success!')
														
--- a/loader.py
+++ b/loader.py
@@ -0,0 +1,14 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from demeter.core import *
														
 
															+
														
 
															+# 命令行传参 python loader.py -o parser -m extract -i 1
														
 
															+param = {}
														
 
															+param['obj'] = 'o'
														
 
															+param['module'] = 'm'
														
 
															+param['id'] = 'i'
														
 
															+Demeter.getopt(param)
														
 
															+
														
 
															+obj = Demeter.option['obj']
														
 
															+module = Demeter.option['module']
														
 
															+id = Demeter.option['id']
														
 
															+Demeter.service('loader').get(obj=obj, module=module, sync=True, id=id)
														
--- a/master_cron.py
+++ b/master_cron.py
@@ -0,0 +1,56 @@
 
															+#!/usr/bin/env python
														
 
															+# -*- coding: utf-8 -*-
														
 
															+# 用于批量处理转换 运行多个转换容器
														
 
															+# nohup python /data/dm/container/web/master.py 2>/dev/null &
														
 
															+import time
														
 
															+import subprocess
														
 
															+import os
														
 
															+import pprint
														
 
															+timeSleep = 120
														
 
															+
														
 
															+def redis():
														
 
															+        import redis
														
 
															+        host = '0.0.0.0'
														
 
															+        port = 6379
														
 
															+        password = 'dm_redis_123'
														
 
															+        pool = redis.ConnectionPool(host=host, password=password, port=int(port))
														
 
															+        return redis.Redis(connection_pool=pool)
														
 
															+
														
 
															+def command(file):
														
 
															+        #return 'dm call office-convert_call id=' + file
														
 
															+        return 'docker run -d -it --entrypoint python --rm -v /data/dm/container/share:/share -v /etc/hosts:/etc/hosts.main --env HOSTIP="172.30.0.6" --net=dm -v /data/dm/container/web:/www -v /data/dm/container/web/convert/static:/usr/local/convert/front/static -v /data/dm/container/web/convert/files:/usr/local/convert/runtime/files registry.cn-hangzhou.aliyuncs.com/shemic/convert  /usr/local/convert/convert.py -f ' + file
														
 
															+
														
 
															+def popen(command, bg=False):
														
 
															+        string = command
														
 
															+        if bg == True:
														
 
															+                command = command + ' &'
														
 
															+        process = os.popen(command)
														
 
															+        output = process.read()
														
 
															+        process.close()
														
 
															+        return output
														
 
															+
														
 
															+# 文档转换
														
 
															+def convert():
														
 
															+        check = 'ps -ef | grep master_cron.py | grep -v grep | wc -l'
														
 
															+        value = int(popen(check))
														
 
															+        if value > 1:
														
 
															+                return 1;
														
 
															+        r = redis()
														
 
															+        c = 'office_file'
														
 
															+        i = 0
														
 
															+        # r.ltrim("list2", 0, 1)
														
 
															+        # n = r.llen(c)
														
 
															+        while 1:
														
 
															+                file = r.lpop(c)
														
 
															+                if file:
														
 
															+                        g = command(file)
														
 
															+                        popen(g, False)
														
 
															+                i = i+1
														
 
															+                if i >= 10:
														
 
															+                        time.sleep(timeSleep)
														
 
															+                        i = 0
														
 
															+
														
 
															+def handle():
														
 
															+        convert()
														
 
															+
														
 
															+handle()
														
--- a/model/__init__.py
+++ b/model/__init__.py
@@ -0,0 +1 @@
 
															+# -*- coding: utf-8 -*-
														
--- a/model/__load__.py
+++ b/model/__load__.py
@@ -0,0 +1,7 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+"""
														
 
															+    demeter database
														
 
															+    name:__load__.py
														
 
															+"""
														
 
															+from demeter.model import *
														
 
															+from demeter.core import *
														
--- a/model/data.py
+++ b/model/data.py
@@ -0,0 +1,13 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from .__load__ import *
														
 
															+
														
 
															+class Data(Model):
														
 
															+    __table__ = 'data'
														
 
															+    __comment__ = '知识库'
														
 
															+    id = Fields(type='int', primaryKey=True, autoIncrement=True, comment='ID')
														
 
															+    site_id = Fields(type='int', comment='所属站点')
														
 
															+    role_id = Fields(type='int', comment='角色id')
														
 
															+    uid = Fields(type='int', comment='用户ID', default='-1')
														
 
															+    name = Fields(type='varchar(32)', comment='知识库标识')
														
 
															+    state = Fields(type='boolean', default='True', comment='数据存在状态')
														
 
															+    cdate = Fields(type='int', default='time', comment='创建时间')
														
--- a/model/extract.py
+++ b/model/extract.py
@@ -0,0 +1,25 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from .__load__ import *
														
 
															+
														
 
															+class Extract(Model):
														
 
															+    __table__ = 'extract'
														
 
															+    __comment__ = '提取文件内容'
														
 
															+    id = Fields(type='int', primaryKey=True, autoIncrement=True, comment='ID')
														
 
															+    site_id = Fields(type='int', comment='所属站点')
														
 
															+    uid = Fields(type='varchar(200)', comment='上传者')
														
 
															+    source_id = Fields(type='int(11)', comment='源文件id')
														
 
															+    source = Fields(type='varchar(500)', comment='源文件')
														
 
															+    notify = Fields(type='varchar(2000)', comment='回调地址')
														
 
															+    name = Fields(type='varchar(200)', comment='文件名')
														
 
															+    page = Fields(type='int(11)', comment='页数')
														
 
															+    # 这里加索引
														
 
															+    key = Fields(type='varchar(100)', index='search', comment='文件key')
														
 
															+    ext = Fields(type='varchar(20)', comment='后缀名')
														
 
															+    size = Fields(type='varchar(200)', comment='源文件大小')
														
 
															+
														
 
															+    file = Fields(type='varchar(200)', comment='本地地址')
														
 
															+    path = Fields(type='varchar(200)', comment='本地资源目录')
														
 
															+
														
 
															+    state = Fields(type='boolean', default='True', comment='数据存在状态')
														
 
															+    status = Fields(type='tinyint', default='1', comment='转换状态1待机2提取中3提取完成4提取失败')
														
 
															+    cdate = Fields(type='int', default='time', comment='创建时间')
														
--- a/model/extract_content.py
+++ b/model/extract_content.py
@@ -0,0 +1,12 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from .__load__ import *
														
 
															+
														
 
															+class Extract_content(Model):
														
 
															+    __table__ = 'extract_content'
														
 
															+    __comment__ = 'pdf内容'
														
 
															+    id = Fields(type='int', primaryKey=True, autoIncrement=True, comment='ID')
														
 
															+    extract_id = Fields(type='int', comment='文件id')
														
 
															+    method = Fields(type='tinyint(1)', comment='方法')
														
 
															+    content = Fields(type='text(255)', comment='内容')
														
 
															+    state = Fields(type='boolean', default='True', comment='数据存在状态')
														
 
															+    cdate = Fields(type='int', default='time', comment='创建时间')
														
--- a/model/file.py
+++ b/model/file.py
@@ -0,0 +1,13 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from .__load__ import *
														
 
															+
														
 
															+class File(Model):
														
 
															+    __table__ = 'file'
														
 
															+    __comment__ = '知识库'
														
 
															+    id = Fields(type='int', primaryKey=True, autoIncrement=True, comment='ID')
														
 
															+    site_id = Fields(type='int', comment='所属站点')
														
 
															+    role_id = Fields(type='int', comment='角色id')
														
 
															+    uid = Fields(type='int', comment='用户ID', default='-1')
														
 
															+    name = Fields(type='varchar(32)', comment='知识库标识')
														
 
															+    state = Fields(type='boolean', default='True', comment='数据存在状态')
														
 
															+    cdate = Fields(type='int', default='time', comment='创建时间')
														
--- a/model/lang_model.py
+++ b/model/lang_model.py
@@ -0,0 +1,13 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from .__load__ import *
														
 
															+
														
 
															+class Lang_model(Model):
														
 
															+	__table__ = 'lang_model'
														
 
															+	__comment__ = '语言模型表'
														
 
															+	id = Fields(type='int', primaryKey=True, autoIncrement=True, comment='站点ID')
														
 
															+	name = Fields(type='varchar(50)', comment='模型名称')
														
 
															+	channel = Fields(type='varchar(20)', comment='模型渠道', default='baidu')
														
 
															+	model = Fields(type='varchar(100)', comment='模型名称', default='ernie-speed-128k')
														
 
															+	status = Fields(type='tinyint', default='1', comment='状态：1是正常2是不可用')
														
 
															+	state = Fields(type='boolean', default='True', comment='数据存在状态')
														
 
															+	cdate = Fields(type='int', default='time', comment='创建时间')
														
--- a/model/role.py
+++ b/model/role.py
@@ -0,0 +1,17 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from .__load__ import *
														
 
															+
														
 
															+class Role(Model):
														
 
															+    __table__ = 'role'
														
 
															+    __comment__ = '角色表'
														
 
															+    id = Fields(type='int', primaryKey=True, autoIncrement=True, comment='ID')
														
 
															+    site_id = Fields(type='int', comment='所属站点')
														
 
															+    create_uid = Fields(type='int', comment='创建人ID', default='-1')
														
 
															+    owner_uid = Fields(type='int', comment='持有人ID', default='-1')
														
 
															+    name = Fields(type='varchar(500)', comment='名称')
														
 
															+    lang_model_id = Fields(type='int(11)', comment='模型ID', default='1')
														
 
															+    persona = Fields(type='text', comment='人设提示词', default='')
														
 
															+    use_num = Fields(type='int', comment='使用次数')
														
 
															+    status = Fields(type='tinyint', default='1', comment='角色状态：1是正常2是冻结')
														
 
															+    state = Fields(type='boolean', default='True', comment='数据存在状态')
														
 
															+    cdate = Fields(type='int', default='time', comment='创建时间')
														
--- a/model/role_data.py
+++ b/model/role_data.py
@@ -0,0 +1,30 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from .__load__ import *
														
 
															+
														
 
															+class Role_data(Model):
														
 
															+    __table__ = 'role_data'
														
 
															+    __comment__ = '角色知识库'
														
 
															+    id = Fields(type='int', primaryKey=True, autoIncrement=True, comment='ID')
														
 
															+    role_id = Fields(type='int', comment='角色id')
														
 
															+    data_id = Fields(type='int', comment='数据文件id')
														
 
															+    state = Fields(type='boolean', default='True', comment='数据存在状态')
														
 
															+    cdate = Fields(type='int', default='time', comment='创建时间')
														
 
															+    
														
 
															+    def getCur(self, id):
														
 
															+        self.id = id
														
 
															+        data = self.select(type='fetchone')
														
 
															+        return data
														
 
															+
														
 
															+    def getList(self, page = 1, param = {}):
														
 
															+        cate = Demeter.model('video_cate').getCur()
														
 
															+        self.cate_id = cate['id']
														
 
															+        Demeter.config['page'] = {}
														
 
															+        Demeter.config['page']['current'] = page
														
 
															+        data = self.select(page=True)
														
 
															+        result = []
														
 
															+        if data:
														
 
															+            for key, value in enumerate(data):
														
 
															+                #cate = Demeter.service('common').one('video_cate', id=value['cate_id'])
														
 
															+                value['cdate'] = Demeter.date(value['cdate'])
														
 
															+                result.append([str(value['id']), value['name'], value['cdate'], ''])
														
 
															+        return result
														
--- a/model/role_sample.py
+++ b/model/role_sample.py
@@ -0,0 +1,12 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from .__load__ import *
														
 
															+
														
 
															+class User_data(Model):
														
 
															+    __table__ = 'user_data'
														
 
															+    __comment__ = '用户数据'
														
 
															+    id = Fields(type='int', primaryKey=True, autoIncrement=True, comment='ID')
														
 
															+    site_id = Fields(type='int', comment='所属站点')
														
 
															+    role_id = Fields(type='int', comment='角色id')
														
 
															+    content = Fields(type='text', comment='内容', default='')
														
 
															+    state = Fields(type='boolean', default='True', comment='数据存在状态')
														
 
															+    cdate = Fields(type='int', default='time', comment='创建时间')
														
--- a/model/signature.py
+++ b/model/signature.py
@@ -0,0 +1,14 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+"""
														
 
															+    demeter database
														
 
															+    name:signature.py
														
 
															+"""
														
 
															+from .__load__ import *
														
 
															+
														
 
															+class Signature(Model):
														
 
															+	__table__ = 'signature'
														
 
															+	__comment__ = 'signature记录表'
														
 
															+	id = Fields(type='int', primaryKey=True, autoIncrement=True, comment='ID')
														
 
															+	site_id = Fields(type='int', comment='所属站点')
														
 
															+	signature = Fields(type='varchar(500)', comment='signature')
														
 
															+	cdate = Fields(type='int', default='time', comment='创建时间')
														
--- a/model/site.py
+++ b/model/site.py
@@ -0,0 +1,16 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from .__load__ import *
														
 
															+
														
 
															+class Site(Model):
														
 
															+	__table__ = 'site'
														
 
															+	__comment__ = '站点主表'
														
 
															+	id = Fields(type='int', primaryKey=True, autoIncrement=True, comment='站点ID')
														
 
															+	name = Fields(type='varchar(50)', comment='站点名')
														
 
															+	link = Fields(type='varchar(200)', comment='站点网址')
														
 
															+	appid = Fields(type='varchar(150)', comment='appid')
														
 
															+	appsecret = Fields(type='varchar(300)', comment='appsecret')
														
 
															+	sdate = Fields(type='int', comment='开始时间')
														
 
															+	edate = Fields(type='int', comment='结束时间')
														
 
															+	api = Fields(type='varchar(2000)', comment='接口地址')
														
 
															+	state = Fields(type='boolean', default='True', comment='数据存在状态')
														
 
															+	cdate = Fields(type='int', default='time', comment='创建时间')
														
--- a/model/user.py
+++ b/model/user.py
@@ -0,0 +1,12 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from .__load__ import *
														
 
															+
														
 
															+class User(Model):
														
 
															+    __table__ = 'user'
														
 
															+    __comment__ = '用户表'
														
 
															+    id = Fields(type='int', primaryKey=True, autoIncrement=True, comment='ID')
														
 
															+    site_id = Fields(type='int', comment='所属站点')
														
 
															+    site_uid = Fields(type='varchar(200)', comment='站点用户ID')
														
 
															+    name = Fields(type='varchar(500)', comment='用户名称')
														
 
															+    state = Fields(type='boolean', default='True', comment='数据存在状态')
														
 
															+    cdate = Fields(type='int', default='time', comment='创建时间')
														
--- a/model/user_data.py
+++ b/model/user_data.py
@@ -0,0 +1,14 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from .__load__ import *
														
 
															+
														
 
															+class User_data(Model):
														
 
															+    __table__ = 'user_data'
														
 
															+    __comment__ = '用户数据'
														
 
															+    id = Fields(type='int', primaryKey=True, autoIncrement=True, comment='ID')
														
 
															+    site_id = Fields(type='int', comment='所属站点')
														
 
															+    role_id = Fields(type='int', comment='角色id')
														
 
															+    uid = Fields(type='int', comment='用户ID', default='-1')
														
 
															+    name = Fields(type='varchar(32)', comment='知识库标识')
														
 
															+    content = Fields(type='text', comment='内容', default='')
														
 
															+    state = Fields(type='boolean', default='True', comment='数据存在状态')
														
 
															+    cdate = Fields(type='int', default='time', comment='创建时间')
														
--- a/model/user_history.py
+++ b/model/user_history.py
@@ -0,0 +1,15 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from .__load__ import *
														
 
															+
														
 
															+class User_history(Model):
														
 
															+    __table__ = 'user_data'
														
 
															+    __comment__ = '用户历史对话'
														
 
															+    id = Fields(type='int', primaryKey=True, autoIncrement=True, comment='ID')
														
 
															+    site_id = Fields(type='int', comment='所属站点')
														
 
															+    role_id = Fields(type='int', comment='角色id')
														
 
															+    uid = Fields(type='int', comment='用户ID', default='-1')
														
 
															+    user_input = Fields(type='text', comment='用户输入', default='')
														
 
															+    ai_response = Fields(type='text', comment='AI响应', default='')
														
 
															+    summary = Fields(type='text', comment='摘要', default='')
														
 
															+    state = Fields(type='boolean', default='True', comment='数据存在状态')
														
 
															+    cdate = Fields(type='int', default='time', comment='创建时间')
														
--- a/pdf.py
+++ b/pdf.py
@@ -0,0 +1,18 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from demeter.core import *
														
 
															+
														
 
															+# 测试转换pdf python convert.py -f file.doc
														
 
															+param = {}
														
 
															+param['file'] = 'f'
														
 
															+Demeter.getopt(param)
														
 
															+
														
 
															+#file = Demeter.option['file']
														
 
															+file = 'D://work/ai/diviner/dev/data/04、Frog Is Hungry.pdf'
														
 
															+# pdf提取功能
														
 
															+
														
 
															+# 直接提取
														
 
															+#result = Demeter.service('loader', 'extract').get(file).json()
														
 
															+
														
 
															+# 用通用方法 同步提取并记录已提取，下次直接用提取后的内容
														
 
															+result = Demeter.service('loader').get(obj='parser', module='extract', sync=False, site_id=1, uid=1, source_id=1, source=file, method='json')
														
 
															+print(result)
														
--- a/requirements.txt
+++ b/requirements.txt
@@ -0,0 +1,15 @@
 
															+demeter-lib
														
 
															+redis
														
 
															+requests
														
 
															+gevent
														
 
															+PyMuPDF
														
 
															+langchain
														
 
															+langchain_community
														
 
															+langchain-huggingface
														
 
															+langgraph
														
 
															+zhipuai
														
 
															+openai
														
 
															+faiss-cpu
														
 
															+transformers
														
 
															+edge-tts>=6.1.3
														
 
															+pysrt>=1.1.2
														
--- a/runtime/__init__.py
+++ b/runtime/__init__.py
@@ -0,0 +1,6 @@
 
															+#!/usr/bin/env python
														
 
															+# -*- coding: utf-8 -*-
														
 
															+"""
														
 
															+    demeter init
														
 
															+    author:rabin
														
 
															+"""
														
--- a/runtime/sqlite/extract
+++ b/runtime/sqlite/extract
@@ -0,0 +1 @@
 
															+[["id", 1], ["site_id", 1], ["uid", 1], ["source_id", 1], ["source", 1], ["name", 1], ["page", 1], ["key", 1], ["ext", 1], ["size", 1], ["file", 1], ["path", 1], ["state", 1], ["status", 1], ["cdate", 1]]
														
--- a/runtime/sqlite/extract_content
+++ b/runtime/sqlite/extract_content
@@ -0,0 +1 @@
 
															+[["id", 1], ["extract_id", 1], ["method", 1], ["content", 1], ["state", 1], ["cdate", 1]]
														
--- a/runtime/sqlite/site
+++ b/runtime/sqlite/site
@@ -0,0 +1 @@
 
															+[["id", 1], ["name", 1], ["link", 1], ["appid", 1], ["appsecret", 1], ["sdate", 1], ["edate", 1], ["api", 1], ["state", 1], ["cdate", 1]]
														
--- a/service/__init__.py
+++ b/service/__init__.py
@@ -0,0 +1 @@
 
															+# -*- coding: utf-8 -*-
														
--- a/service/__load__.py
+++ b/service/__load__.py
@@ -0,0 +1,6 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from demeter.core import *
														
 
															+from datetime import *
														
 
															+import uuid
														
 
															+import os
														
 
															+import os.path
														
--- a/service/agent/agent.py
+++ b/service/agent/agent.py
@@ -0,0 +1,23 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from .__load__ import *
														
 
															+from langchain_core.language_models.chat_models import HumanMessage
														
 
															+from langchain_core.prompts import ChatPromptTemplate
														
 
															+from langchain_core.output_parsers import StrOutputParser
														
 
															+
														
 
															+class Chat(object):
														
 
															+
														
 
															+    chain = False
														
 
															+    def say(self, content):
														
 
															+        return [HumanMessage(content=content)]
														
 
															+
														
 
															+    def set(self, prompts = []):
														
 
															+        chain = ChatPromptTemplate.from_messages(prompts)
														
 
															+        if not self.chain:
														
 
															+            self.chain = chain
														
 
															+        else:
														
 
															+            self.chain = self.chain | chain
														
 
															+
														
 
															+    def out(self, handle, var = {}):
														
 
															+        chain = self.chain | handle | StrOutputParser()
														
 
															+        for chunk in chain.stream(var):
														
 
															+            print(chunk, end="")
														
--- a/service/agent/init.py
+++ b/service/agent/init.py
@@ -0,0 +1,12 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from .__load__ import *
														
 
															+from langchain_huggingface import HuggingFaceEmbeddings
														
 
															+class Init(object):
														
 
															+
														
 
															+    def __init__(self):
														
 
															+        model_name = "BAAI/bge-small-zh-v1.5"
														
 
															+        model_kwargs = {"device": "cpu"}
														
 
															+        encode_kwargs = {"normalize_embeddings": True}
														
 
															+        Demeter.embedding = HuggingFaceEmbeddings(
														
 
															+            model_name=model_name, model_kwargs=model_kwargs, encode_kwargs=encode_kwargs
														
 
															+        )
														
--- a/service/agent/rag.py
+++ b/service/agent/rag.py
@@ -0,0 +1,23 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from .__load__ import *
														
 
															+from langchain_core.language_models.chat_models import HumanMessage
														
 
															+from langchain_core.prompts import ChatPromptTemplate
														
 
															+from langchain_core.output_parsers import StrOutputParser
														
 
															+
														
 
															+class Chat(object):
														
 
															+
														
 
															+    chain = False
														
 
															+    def say(self, content):
														
 
															+        return [HumanMessage(content=content)]
														
 
															+
														
 
															+    def set(self, prompts = []):
														
 
															+        chain = ChatPromptTemplate.from_messages(prompts)
														
 
															+        if not self.chain:
														
 
															+            self.chain = chain
														
 
															+        else:
														
 
															+            self.chain = self.chain | chain
														
 
															+
														
 
															+    def out(self, handle, var = {}):
														
 
															+        chain = self.chain | handle | StrOutputParser()
														
 
															+        for chunk in chain.stream(var):
														
 
															+            print(chunk, end="")
														
--- a/service/agent/role.py
+++ b/service/agent/role.py
@@ -0,0 +1,104 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from .__load__ import *
														
 
															+from langchain_core.prompts import ChatPromptTemplate
														
 
															+from langchain_core.output_parsers import StrOutputParser
														
 
															+from langchain_core.runnables import RunnablePassthrough
														
 
															+class Role(object):
														
 
															+
														
 
															+    def init(self, site_id, role_id, uid):
														
 
															+        self.info = Demeter.service('common').one('role', id=role_id)
														
 
															+        if self.info:
														
 
															+            self.model = Demeter.service('common').one('lang_model', id=self.info['lang_model_id'])
														
 
															+        self.db = None
														
 
															+        self.piece = None
														
 
															+        #self.memory()
														
 
															+        # 知识库挂载
														
 
															+        data = Demeter.service('data').init(site_id)
														
 
															+        context = data.load('similarity', {'k':5, 'fetch_k':50, 'filter': {'role_id': role_id, 'uid' : uid}})
														
 
															+        #sample = data.load('similarity', {'k':5, 'fetch_k':50, 'filter': {'role_id': role_id, 'uid': 'sample'}})
														
 
															+        print(context)
														
 
															+        self.piece = {"context": context | self.format_docs, "question": RunnablePassthrough()}
														
 
															+        return self
														
 
															+
														
 
															+    # 写入记忆
														
 
															+    def write(self, memory):
														
 
															+        pass
														
 
															+
														
 
															+    # 挂载工具
														
 
															+    def tool(self, tool):
														
 
															+        pass
														
 
															+
														
 
															+    def set(self, prompts):
														
 
															+        chain = ChatPromptTemplate.from_template(prompts)
														
 
															+        if not self.piece:
														
 
															+            self.piece = chain
														
 
															+        else:
														
 
															+            self.piece = self.piece | chain
														
 
															+        return self
														
 
															+
														
 
															+    def out(self, query, type = []):
														
 
															+        if self.info:
														
 
															+            #self.info['persona'] = '你是一个精美时尚杂志社的编辑，根据以下上下文来回答这个问题{context}'
														
 
															+            template = """你是一个精美时尚杂志社的编辑，根据以下上下文来回答这个问题:
														
 
															+
														
 
															+            {context}
														
 
															+
														
 
															+            Question: {question},请用中文输出答案。
														
 
															+            """
														
 
															+
														
 
															+            template = """你是一位专业医生。以下是病人的病例内容，请根据医学规范生成详细分析报告。
														
 
															+
														
 
															+            病例内容：
														
 
															+            {context}
														
 
															+
														
 
															+
														
 
															+            请根据上面提供的病例内容生成报告。根据病人的核心关注需求提供解决方案。
														
 
															+            报告要求：
														
 
															+            1. 核心健康问题汇总
														
 
															+            2. 潜在风险与关联性分析
														
 
															+            3. 综合健康建议
														
 
															+            4. 紧急情况预警
														
 
															+            5. 解决方案
														
 
															+
														
 
															+            请以word格式输出，我好直接生成word。
														
 
															+            """
														
 
															+            
														
 
															+            self.set(template)
														
 
															+            self.model = Demeter.service(self.model['channel'], 'llm').load(model='deepseek-r1', streaming=True)
														
 
															+            full_report = ""
														
 
															+            chain = (self.piece | self.model | StrOutputParser())
														
 
															+            for chunk in chain.stream(query):
														
 
															+                print(chunk, end="")
														
 
															+                full_report += chunk
														
 
															+            #self.save_docx(full_report)
														
 
															+
														
 
															+    def format_docs(self, docs):
														
 
															+        return "\n\n".join([d.page_content for d in docs])
														
 
															+
														
 
															+    def save_docx(self, content):
														
 
															+        patient_id = self.info.get('uid', 'unknown')  # 或者 role_id
														
 
															+        timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
														
 
															+        filename = f"report_{patient_id}_{timestamp}.docx"
														
 
															+        output_dir = "reports"
														
 
															+        os.makedirs(output_dir, exist_ok=True)
														
 
															+        filepath = os.path.join(output_dir, filename)
														
 
															+
														
 
															+        doc = Document()
														
 
															+        doc.add_heading('诊断报告', 0)
														
 
															+        doc.add_paragraph(report_text)
														
 
															+        doc.save(filepath)
														
 
															+
														
 
															+        print(f"\n\n📝 报告已保存为：{filepath}")
														
 
															+
														
 
															+    # 生成角色
														
 
															+    def create(self, site_id, uid, name, persona, lang_model_id, data, tool):
														
 
															+        db = Demeter.db('role')
														
 
															+        db.site_id = site_id
														
 
															+        db.create_uid = create_uid
														
 
															+        db.owner_uid = owner_uid
														
 
															+        db.persona = persona
														
 
															+        db.lang_model_id = lang_model_id
														
 
															+        id = db.insert()
														
 
															+        if len(data) > 0:
														
 
															+            for key, value in enumerate(data):
														
 
															+                pass
														
--- a/service/auth.py
+++ b/service/auth.py
@@ -0,0 +1,74 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from .__load__ import *
														
 
															+class Auth(object):
														
 
															+    def init(self, param=param, request=False):
														
 
															+        if 'appid' not in param:
														
 
															+            return '参数错误：appid'
														
 
															+        if 'timestamp' not in param:
														
 
															+            return '参数错误：timestamp'
														
 
															+        if 'nonce' not in param:
														
 
															+            return '参数错误：nonce'
														
 
															+        if 'signature' not in param:
														
 
															+            return '参数错误：signature'
														
 
															+
														
 
															+        model = Demeter.model('site')
														
 
															+        model.appid = param['appid']
														
 
															+        site = model.select(type='fetchone')
														
 
															+        if not site:
														
 
															+            return '站点信息不存在'
														
 
															+
														
 
															+        time = Demeter.time()
														
 
															+        if time < site['sdate'] or time > site['edate']:
														
 
															+            return '授权已失效'
														
 
															+        if time - int(param['timestamp']) > 600:
														
 
															+            return '签名已过期'
														
 
															+
														
 
															+        if request:
														
 
															+            # 针对域名做白名单
														
 
															+            referer = request.headers.get("Referer")
														
 
															+            if not referer:
														
 
															+                return '验证失败：来源错误'
														
 
															+
														
 
															+            host = Demeter.host(site['link'])
														
 
															+            if host != Demeter.host(referer):
														
 
															+                return '验证失败：来源错误'
														
 
															+
														
 
															+            uri = self.getHost(request) + request.uri
														
 
															+            if referer == uri:
														
 
															+                return '验证失败：来源错误'
														
 
															+
														
 
															+        param['appsecret'] = site['appsecret']
														
 
															+        if self.signature(param) != signature:
														
 
															+            return '验签失败'
														
 
															+        return site
														
 
															+
														
 
															+    def getHost(self, request):
														
 
															+        host = request.host.replace(':8088', '')
														
 
															+        host = request.protocol + "://" + host
														
 
															+        return host
														
 
															+
														
 
															+    def signature(self, param):
														
 
															+        for k, v in param.items():
														
 
															+            all_params[k] = str(v)
														
 
															+        sorted_items = sorted(all_params.items(), key=lambda x: x[0])
														
 
															+        param_str = "&".join(f"{k}={v}" for k, v in sorted_items)
														
 
															+        return Demeter.md5(param_str)
														
 
															+
														
 
															+
														
 
															+    # sign 只能使用一次 以后再说吧
														
 
															+    def check(self, param):
														
 
															+        model = Demeter.model('signature')
														
 
															+        model.appid = param['appid']
														
 
															+        model.signature = param['signature']
														
 
															+        info = model.select(type='fetchone')
														
 
															+        if info:
														
 
															+            return False
														
 
															+        model.site_id = param['appid']
														
 
															+        model.signature = param['signature']
														
 
															+        model.insert()
														
 
															+
														
 
															+    def clear(self):
														
 
															+        num = Demeter.time() - 3600*24
														
 
															+        model = Demeter.model('signature')
														
 
															+        model.cdate.assign(num, exp='<=')
														
 
															+        model.delete()
														
--- a/service/callback.py
+++ b/service/callback.py
@@ -0,0 +1,19 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from .__load__ import *
														
 
															+# 回调
														
 
															+class Callback(object):
														
 
															+
														
 
															+    def send(self, site_id, param):
														
 
															+        model = Demeter.model('site')
														
 
															+        model.id = site_id
														
 
															+        site = model.select(type='fetchone')
														
 
															+        if 'notify' in param and param['notify']:
														
 
															+            site['api'] = param['notify']
														
 
															+        if 'api' in site and site['api']:
														
 
															+            api = site['api']
														
 
															+            param['appid'] = site['appid']
														
 
															+            param['appsecret'] = site['appsecret']
														
 
															+            param['timestamp'] = Demeter.time()
														
 
															+            param['nonce'] = Demeter.hash()
														
 
															+            param['signature'] = Dever.service('auth').signature(param)
														
 
															+            Demeter.curl(api, param, 'post')
														
--- a/service/comfyui/comfyui.py
+++ b/service/comfyui/comfyui.py
@@ -0,0 +1,163 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from .__load__ import *
														
 
															+class Comfyui(object):
														
 
															+
														
 
															+    def info(self, file, check = False):
														
 
															+        output = self.act(file, False, False, check)
														
 
															+        info = {}
														
 
															+        if output:
														
 
															+            # 提取格式信息
														
 
															+            format_info = re.search(r"Input #0, (.*?), from", output)
														
 
															+            if format_info:
														
 
															+                info['format'] = format_info.group(1)
														
 
															+
														
 
															+            # 提取时长信息
														
 
															+            duration_match = re.search(r'Duration: (\d+):(\d+):(\d+).(\d+)', output)
														
 
															+            if duration_match:
														
 
															+                hours = duration_match.group(1)
														
 
															+                minutes = duration_match.group(2)
														
 
															+                seconds = duration_match.group(3)
														
 
															+                milliseconds = duration_match.group(4)
														
 
															+                info['total_seconds'] = int(hours) * 3600 + int(minutes) * 60 + int(seconds) + int(milliseconds) / 100
														
 
															+                info['duration'] = hours + ':' + minutes + ':' + seconds + '.' + milliseconds
														
 
															+
														
 
															+            # 提取比特率信息
														
 
															+            bitrate_info = re.search(r"bitrate: (\d+ kb/s)", output)
														
 
															+            if bitrate_info:
														
 
															+                info['bitrate'] = bitrate_info.group(1)
														
 
															+
														
 
															+            # 提取视频流信息
														
 
															+            video_stream_info = re.search(r"Stream #(\d+:\d+).*: Video: (.*?), (\d+x\d+)", output)
														
 
															+            if video_stream_info:
														
 
															+                info['video_stream'] = video_stream_info.group(1)
														
 
															+                info['video_codec'] = video_stream_info.group(2)
														
 
															+                resolution = video_stream_info.group(3)
														
 
															+                info['resolution'] = resolution
														
 
															+                width, height = resolution.split('x')
														
 
															+                info['width'] = int(width)
														
 
															+                info['height'] = int(height)
														
 
															+
														
 
															+            # 提取音频流信息
														
 
															+            audio_stream_info = re.search(r"Stream #(\d+:\d+).*: Audio: (.*?), (\d+ Hz)", output)
														
 
															+            if audio_stream_info:
														
 
															+                info['audio_stream'] = audio_stream_info.group(1)
														
 
															+                info['audio_codec'] = audio_stream_info.group(2)
														
 
															+                info['audio_sample_rate'] = audio_stream_info.group(3)
														
 
															+
														
 
															+            match = re.search(r'(\d+(\.\d+)?) fps', output)
														
 
															+            if match:
														
 
															+                info['fps'] = float(match.group(1))
														
 
															+                info['frame'] = info['fps'] * info['total_seconds']
														
 
															+
														
 
															+        return info
														
 
															+
														
 
															+    def act(self, input, output, option = {}, check = False):
														
 
															+        self.cmd = [Demeter.ffmpeg]
														
 
															+        self.cmd.append(self.input(input))
														
 
															+        if option:
														
 
															+            for k, v in option.items():
														
 
															+                if not isinstance(v, list):
														
 
															+                    v = [v]
														
 
															+                method = getattr(self, k)
														
 
															+                self.cmd.append(method(*v))
														
 
															+
														
 
															+        if output:
														
 
															+            self.cmd.append(self.output(output))
														
 
															+        cmd = self.implode(' ', self.cmd)
														
 
															+        if check:
														
 
															+            print(cmd);
														
 
															+            return
														
 
															+        result = subprocess.run(cmd, stdout=subprocess.PIPE, stderr=subprocess.PIPE, text=True, bufsize=1, encoding='latin-1')
														
 
															+        return result.stderr
														
 
															+
														
 
															+    # 获取视频
														
 
															+    def input(self, video):
														
 
															+        if isinstance(video, dict):
														
 
															+            return self.option(video['option'], ' -i ' + video['file'])
														
 
															+        return '-i "' + video + '"'
														
 
															+
														
 
															+    # 输出视频
														
 
															+    def output(self, video):
														
 
															+        #'-b:v 10000k'
														
 
															+        if isinstance(video, dict):
														
 
															+            return self.option(video['option'], ' ' + video['file'])
														
 
															+        return '-y ' + video
														
 
															+
														
 
															+    # 按照时间截取
														
 
															+    def time(self, max, start = 0):
														
 
															+        return '-ss ' + self.gmdate('%H:%M:%S', start) + ' -t ' + self.gmdate('%H:%M:%S', max)
														
 
															+
														
 
															+    # video过滤器
														
 
															+    def video(self, video):
														
 
															+        if video:
														
 
															+            cmd = []
														
 
															+            for k, v in video.items():
														
 
															+                cmd.append(self.filter('video', k, v))
														
 
															+            return '-vf "'+self.implode(',', cmd)+'"'
														
 
															+        return ''
														
 
															+
														
 
															+    # audio过滤器
														
 
															+    def audio(self, audio):
														
 
															+        if video:
														
 
															+            cmd = []
														
 
															+            for k, v in audio.items():
														
 
															+                cmd.append(self.filter('audio', k, v))
														
 
															+            return '-af "'+self.implode(',', cmd)+'"'
														
 
															+        return ''
														
 
															+
														
 
															+    # 复杂过滤器
														
 
															+    def filter_complex(self, param):
														
 
															+        cmd = []
														
 
															+        for k, v in param.items():
														
 
															+            cmd.append(v)
														
 
															+        return '-filter_complex "'+self.implode(';', cmd)+'"'
														
 
															+
														
 
															+    # 过滤器 -简单过滤器
														
 
															+    def filter(self, type, method, param):
														
 
															+        service = Demeter.service(type, 'filter')
														
 
															+        if hasattr(service, method):
														
 
															+            method = getattr(service, method)
														
 
															+            if not isinstance(param, list):
														
 
															+                param = [param]
														
 
															+            return method(*param)
														
 
															+        else:
														
 
															+            if isinstance(param, list):
														
 
															+                tmp = []
														
 
															+                for k, v in param.items():
														
 
															+                    if v:
														
 
															+                        v = '=' + v
														
 
															+                    tmp.append(k + v)
														
 
															+                param = self.implode(':', tmp)
														
 
															+            if param:
														
 
															+                param = '=' + param
														
 
															+            return method + param
														
 
															+
														
 
															+    # 获取选项
														
 
															+    def option(self, option, suffix = ''):
														
 
															+        tmp = []
														
 
															+        if option:
														
 
															+            for k, v in option.items():
														
 
															+                if v:
														
 
															+                    v = ' ' + v
														
 
															+                if isinstance(k, str) and k:
														
 
															+                    tmp.append('-' + self.alias(k) + v)
														
 
															+                else:
														
 
															+                    tmp.append(v)
														
 
															+        return self.implode(' ', tmp) + suffix
														
 
															+
														
 
															+    # 设置别名
														
 
															+    def alias(self, k):
														
 
															+        if k == 'audio':
														
 
															+            return 'b:a'
														
 
															+        if k == 'video':
														
 
															+            return 'b:v'
														
 
															+        return k
														
 
															+
														
 
															+    def implode(self, stn, lst):
														
 
															+        return stn.join(map(str, lst))
														
 
															+
														
 
															+    def gmdate(self, format, start):
														
 
															+        # 将给定的时间戳转换为 datetime 对象
														
 
															+        dt = datetime.fromtimestamp(start, tz=timezone.utc)
														
 
															+        # 使用 strftime 方法格式化 datetime 对象
														
 
															+        return dt.strftime(format)
														
--- a/service/data/__init__.py
+++ b/service/data/__init__.py
@@ -0,0 +1 @@
 
															+# -*- coding: utf-8 -*-
														
--- a/service/data/db.py
+++ b/service/data/db.py
@@ -0,0 +1,28 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from .__load__ import *
														
 
															+from langchain_community.vectorstores import FAISS
														
 
															+
														
 
															+class Db(object):
														
 
															+
														
 
															+    def __init__(self):
														
 
															+        Demeter.service('init')
														
 
															+        self.embedding = Demeter.embedding
														
 
															+        self.path = File.path() + 'data/db/'
														
 
															+
														
 
															+    def write(self, id, data):
														
 
															+        name = self.name(id)
														
 
															+        if File.exists(name):
														
 
															+            db = FAISS.load_local(name, embeddings=self.embedding, allow_dangerous_deserialization=True)
														
 
															+            db.add_documents(data)
														
 
															+        else:
														
 
															+            db = FAISS.from_documents(data, embedding=self.embedding)
														
 
															+        db.save_local(name)
														
 
															+        return db
														
 
															+
														
 
															+    def read(self, id):
														
 
															+        db = FAISS.load_local(self.name(id), embeddings=self.embedding, allow_dangerous_deserialization=True)
														
 
															+        return db
														
 
															+
														
 
															+    def name(self, name):
														
 
															+        name = str(name)
														
 
															+        return File.dest(self.path, Demeter.md5(name))
														
--- a/service/data/faiss.py
+++ b/service/data/faiss.py
@@ -0,0 +1,28 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from .__load__ import *
														
 
															+from langchain_community.vectorstores import FAISS
														
 
															+
														
 
															+class Db(object):
														
 
															+
														
 
															+    def __init__(self):
														
 
															+        Demeter.service('init')
														
 
															+        self.embedding = Demeter.embedding
														
 
															+        self.path = File.path() + 'data/db/'
														
 
															+
														
 
															+    def write(self, id, data):
														
 
															+        name = self.name(id)
														
 
															+        if File.exists(name):
														
 
															+            db = FAISS.load_local(name, embeddings=self.embedding, allow_dangerous_deserialization=True)
														
 
															+            db.add_documents(data)
														
 
															+        else:
														
 
															+            db = FAISS.from_documents(data, embedding=self.embedding)
														
 
															+        db.save_local(name)
														
 
															+        return db
														
 
															+
														
 
															+    def read(self, id):
														
 
															+        db = FAISS.load_local(self.name(id), embeddings=self.embedding, allow_dangerous_deserialization=True)
														
 
															+        return db
														
 
															+
														
 
															+    def name(self, name):
														
 
															+        name = str(name)
														
 
															+        return File.dest(self.path, Demeter.md5(name))
														
--- a/service/extract/__init__.py
+++ b/service/extract/__init__.py
@@ -0,0 +1 @@
 
															+# -*- coding: utf-8 -*-
														
--- a/service/extract/__load__.py
+++ b/service/extract/__load__.py
@@ -0,0 +1,6 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from demeter.core import *
														
 
															+from datetime import *
														
 
															+import uuid
														
 
															+import os
														
 
															+import os.path
														
--- a/service/extract/docs/__init__.py
+++ b/service/extract/docs/__init__.py
@@ -0,0 +1 @@
 
															+# -*- coding: utf-8 -*-
														
--- a/service/extract/docs/__load__.py
+++ b/service/extract/docs/__load__.py
@@ -0,0 +1,6 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from demeter.core import *
														
 
															+import os
														
 
															+import io
														
 
															+import re
														
 
															+from .base import Base
														
--- a/service/extract/docs/base.py
+++ b/service/extract/docs/base.py
@@ -0,0 +1,27 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from .__load__ import *
														
 
															+class Base(object):
														
 
															+
														
 
															+    # 初始化
														
 
															+    def init(self, file, param = {}):
														
 
															+        self.file = file
														
 
															+        self.param = param
														
 
															+        return self
														
 
															+
														
 
															+    # 获取路径
														
 
															+    def getPath(self):
														
 
															+        if 'path' not in self.param:
														
 
															+            pdf_dir = os.path.dirname(self.file)
														
 
															+            pdf_name = os.path.splitext(os.path.basename(self.file))[0]
														
 
															+            self.param['path'] = os.path.join(pdf_dir, pdf_name)
														
 
															+            if not os.path.exists(self.param['path']):
														
 
															+                os.makedirs(self.param['path'])
														
 
															+
														
 
															+    # 移除域名
														
 
															+    def removeDomains(self, text):
														
 
															+        # 匹配 URL、域名，包含 http(s)、www、裸域名
														
 
															+        domain_pattern = re.compile(
														
 
															+            r"(https?://[^\s]+|www\.[^\s]+|(?<!@)\b[a-zA-Z0-9.-]+\.[a-zA-Z]{2,}(?!\w))",
														
 
															+            re.IGNORECASE
														
 
															+        )
														
 
															+        return domain_pattern.sub("", text).strip()
														
--- a/service/extract/docs/csv.py
+++ b/service/extract/docs/csv.py
@@ -0,0 +1,9 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from .__load__ import *
														
 
															+from langchain_community.document_loaders.csv_loader import CSVLoader
														
 
															+
														
 
															+class Csv(object):
														
 
															+
														
 
															+    def run(self, file, param = {}):
														
 
															+        loader = CSVLoader(file_path=file, encoding='utf-8')
														
 
															+        return loader.load()
														
--- a/service/extract/docs/excel.py
+++ b/service/extract/docs/excel.py
@@ -0,0 +1,9 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from .__load__ import *
														
 
															+from langchain_community.document_loaders import UnstructuredExcelLoader
														
 
															+
														
 
															+class Excel(object):
														
 
															+
														
 
															+    def run(self, file, param = {}):
														
 
															+        loader = UnstructuredExcelLoader(file, mode='elements', **param)
														
 
															+        return loader.load()
														
--- a/service/extract/docs/html.py
+++ b/service/extract/docs/html.py
@@ -0,0 +1,9 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from .__load__ import *
														
 
															+from langchain_community.document_loaders import UnstructuredHTMLLoader
														
 
															+
														
 
															+class Html(object):
														
 
															+
														
 
															+    def run(self, file, param = {}):
														
 
															+        loader = UnstructuredHTMLLoader(file, encoding='utf-8')
														
 
															+        return loader.load()
														
--- a/service/extract/docs/img.py
+++ b/service/extract/docs/img.py
@@ -0,0 +1,29 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from .__load__ import *
														
 
															+from langchain_community.document_loaders import UnstructuredImageLoader
														
 
															+from langchain.schema import Document
														
 
															+from aip import AipOcr
														
 
															+#from PIL import Image
														
 
															+#from cnocr import CnOcr
														
 
															+#from pix2text import Pix2Text, merge_line_texts
														
 
															+
														
 
															+class Img(object):
														
 
															+
														
 
															+    def run(self, file, param = {}):
														
 
															+        #loader = UnstructuredImageLoader(file, mode='single', **param)
														
 
															+        #return loader.load()
														
 
															+        with open(file, 'rb') as image_file:
														
 
															+            image_data = image_file.read()
														
 
															+
														
 
															+
														
 
															+        # 初始化AipOcr对象
														
 
															+        client = AipOcr(Demeter.config['baiduocr']['app_id'], Demeter.config['baiduocr']['api_key'], Demeter.config['baiduocr']['secret_key'])
														
 
															+
														
 
															+        # 调用百度OCR接口识别文字
														
 
															+        result = client.basicGeneral(image_data)
														
 
															+        text = ''
														
 
															+        if 'words_result' in result:
														
 
															+            for item in result['words_result']:
														
 
															+                text += item['words'] + '\n'
														
 
															+        data = Document(page_content=text, metadata={"source": "ocr"})
														
 
															+        return data
														
--- a/service/extract/docs/json.py
+++ b/service/extract/docs/json.py
@@ -0,0 +1,10 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+# pip install jq
														
 
															+from .__load__ import *
														
 
															+from langchain_community.document_loaders import JSONLoader
														
 
															+
														
 
															+class Json(object):
														
 
															+
														
 
															+    def run(self, file, param = {}):
														
 
															+        loader = JSONLoader(file_path=file, **param)
														
 
															+        return loader.load()
														
--- a/service/extract/docs/pdf.py
+++ b/service/extract/docs/pdf.py
@@ -0,0 +1,110 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from .__load__ import *
														
 
															+#from langchain_community.document_loaders import PyPDFLoader
														
 
															+import fitz
														
 
															+#from PIL import Image
														
 
															+class Pdf(Base):
														
 
															+    # 提取为json格式
														
 
															+    def json(self):
														
 
															+        if not self.file:
														
 
															+            return False
														
 
															+        self.getPath()
														
 
															+        doc = fitz.open(self.file)
														
 
															+        page = doc.page_count
														
 
															+        result = {'page': page, 'content': []}
														
 
															+
														
 
															+        for page_num in range(len(doc)):
														
 
															+            page = doc.load_page(page_num)
														
 
															+            page_height = page.rect.height
														
 
															+            blocks = page.get_text("dict", sort=True)["blocks"]
														
 
															+            page_items = []
														
 
															+
														
 
															+            for i, b in enumerate(blocks):
														
 
															+                # 去除页眉页脚：bbox[1] 是顶部Y坐标，bbox[3] 是底部Y坐标
														
 
															+                y_top = b["bbox"][1]
														
 
															+                y_bottom = b["bbox"][3]
														
 
															+                if y_top < page_height * 0.05 or y_bottom > page_height * 0.95:
														
 
															+                    continue
														
 
															+
														
 
															+                if b['type'] == 0:
														
 
															+                    text_content = ""
														
 
															+                    for line in b["lines"]:
														
 
															+                        for span in line["spans"]:
														
 
															+                            span_text = span["text"]
														
 
															+                            text_content += span_text
														
 
															+                        text_content += "\n"
														
 
															+                    text_content = text_content.strip()
														
 
															+                    text_content = self.removeDomains(text_content)
														
 
															+                    if text_content:
														
 
															+                        page_items.append({
														
 
															+                            "type": "text",
														
 
															+                            "pos": b["bbox"],
														
 
															+                            "content": text_content,
														
 
															+                            "page": page_num + 1
														
 
															+                        })
														
 
															+
														
 
															+                elif b['type'] == 1:  # 图片块
														
 
															+                    image_bytes = b.get("image", b"")
														
 
															+                    if not image_bytes or len(image_bytes) < 100:
														
 
															+                        continue
														
 
															+                    try:
														
 
															+                        pix = fitz.Pixmap(doc, b["image"])
														
 
															+                        if pix.width < 10 or pix.height < 10:
														
 
															+                            continue
														
 
															+                    except Exception:
														
 
															+                        pass
														
 
															+                    image_ext = "png"
														
 
															+                    filename = f"{self.param['path']}page{page_num+1}_img_{i}.{image_ext}"
														
 
															+                    with open(filename, "wb") as f:
														
 
															+                        f.write(image_bytes)
														
 
															+
														
 
															+                    page_items.append({
														
 
															+                        "type": "image",
														
 
															+                        "pos": b["bbox"],
														
 
															+                        "ext": image_ext,
														
 
															+                        "filename": filename,
														
 
															+                        "page": page_num + 1,
														
 
															+                    })
														
 
															+
														
 
															+            result['content'].extend(page_items)
														
 
															+        return result
														
 
															+
														
 
															+    # 提取为langchain的Document格式
														
 
															+    def doc(self):
														
 
															+        if not self.file:
														
 
															+            return False
														
 
															+        #loader = PyPDFLoader(self.file, extract_images=False)
														
 
															+        #return loader.load()
														
 
															+        doc = fitz.open(self.file)
														
 
															+        result = {'page': page, 'content': []}
														
 
															+        for page_num in range(len(doc)):
														
 
															+            page = doc.load_page(page_num)
														
 
															+            
														
 
															+            # 提取文本
														
 
															+            text = page.get_text()
														
 
															+
														
 
															+            # 提取图片中的文字
														
 
															+            image_texts = []
														
 
															+            for img in page.get_images(full=True):
														
 
															+                xref = img[0]
														
 
															+                base_image = doc.extract_image(xref)
														
 
															+                image_bytes = base_image["image"]
														
 
															+                image = Image.open(io.BytesIO(image_bytes))
														
 
															+
														
 
															+                #result = Demeter.service('loader', 'extract').get(image)
														
 
															+
														
 
															+                ocr_result = ocr.ocr(image)
														
 
															+                for line in ocr_result[0]:
														
 
															+                    image_texts.append(line[1])
														
 
															+
														
 
															+                '''
														
 
															+                # OCR 识别
														
 
															+                ocr_result = ocr_reader.readtext(image)
														
 
															+                image_texts = " ".join([line[1] for line in ocr_result]).strip()
														
 
															+                '''
														
 
															+
														
 
															+            # 合并文字 + 图片文字
														
 
															+            full_text = text.strip() + "\n" + "\n".join(image_texts)
														
 
															+            document = langchain.schema.Document(page_content=full_text)
														
 
															+            result['content'].append(document)
														
 
															+        return result
														
--- a/service/extract/docs/ppt.py
+++ b/service/extract/docs/ppt.py
@@ -0,0 +1,9 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from .__load__ import *
														
 
															+from langchain_community.document_loaders import UnstructuredPowerPointLoader
														
 
															+
														
 
															+class Ppt(object):
														
 
															+
														
 
															+    def run(self, file, param = {}):
														
 
															+        loader = UnstructuredPowerPointLoader(file, mode='elements', **param)
														
 
															+        return loader.load()
														
--- a/service/extract/docs/text.py
+++ b/service/extract/docs/text.py
@@ -0,0 +1,9 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from .__load__ import *
														
 
															+from langchain_community.document_loaders import TextLoader
														
 
															+
														
 
															+class Text(object):
														
 
															+
														
 
															+    def run(self, file, param = {}):
														
 
															+        loader = TextLoader(file, encoding='utf-8')
														
 
															+        return loader.load()
														
--- a/service/extract/docs/web.py
+++ b/service/extract/docs/web.py
@@ -0,0 +1,9 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from .__load__ import *
														
 
															+from langchain_community.document_loaders import WebBaseLoader
														
 
															+
														
 
															+class Web(object):
														
 
															+
														
 
															+    def run(self, file, param = {}):
														
 
															+        loader = WebBaseLoader(file, **param)
														
 
															+        return loader.load()
														
--- a/service/extract/docs/word.py
+++ b/service/extract/docs/word.py
@@ -0,0 +1,9 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from .__load__ import *
														
 
															+from langchain_community.document_loaders import UnstructuredWordDocumentLoader
														
 
															+
														
 
															+class Word(object):
														
 
															+
														
 
															+    def run(self, file, param = {}):
														
 
															+        loader = UnstructuredWordDocumentLoader(file, mode='elements', **param)
														
 
															+        return loader.load()
														
--- a/service/extract/extract.py
+++ b/service/extract/extract.py
@@ -0,0 +1,335 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from .__load__ import *
														
 
															+
														
 
															+class Extract(object):
														
 
															+
														
 
															+    def update(self, site, appid, source_file, source_id, source_type, uid):
														
 
															+
														
 
															+        info = self.getFile(appid, source_file)
														
 
															+
														
 
															+        extract = Demeter.model('extract')
														
 
															+        extract.site_id = site
														
 
															+        extract.key = info['key']
														
 
															+
														
 
															+        data = extract.select(type='fetchone')
														
 
															+        if not data:
														
 
															+            extract.site_id = site
														
 
															+            extract.uid = uid
														
 
															+            extract.key = info['key']
														
 
															+            extract.name = info['name']
														
 
															+            extract.source_id = source_id
														
 
															+            extract.source_type = source_type
														
 
															+            extract.source_size = 0
														
 
															+            extract.source_file = info['source_file']
														
 
															+            extract.local_file = info['local_file']
														
 
															+            extract.local_path = info['local_path']
														
 
															+            id = extract.insert()
														
 
															+            info['status'] = 1
														
 
															+            info['id'] = id
														
 
															+        else:
														
 
															+            info['id'] = data['id']
														
 
															+            info['status'] = data['status']
														
 
															+        if uid:
														
 
															+            self.auth(site, uid, info['id'], 1)
														
 
															+
														
 
															+        return info
														
 
															+
														
 
															+    def getAuth(self, site, uid, extract_id):
														
 
															+        auth = Demeter.model('extract_auth')
														
 
															+        auth.uid = uid
														
 
															+        auth.site_id = site
														
 
															+        auth.extract_id = extract_id
														
 
															+        data = auth.select(type='fetchone')
														
 
															+        return data
														
 
															+
														
 
															+
														
 
															+    def auth(self, site, uid, extract_id, status):
														
 
															+        auth = Demeter.model('extract_auth')
														
 
															+        auth.uid = uid
														
 
															+        auth.site_id = site
														
 
															+        auth.extract_id = extract_id
														
 
															+        data = auth.select(type='fetchone')
														
 
															+        if not data:
														
 
															+            auth.site_id = site
														
 
															+            auth.uid = uid
														
 
															+            auth.extract_id = extract_id
														
 
															+            auth.status = status
														
 
															+            auth.insert()
														
 
															+        elif data['status'] != status:
														
 
															+            # 适用于文档转让
														
 
															+            auth.id = data['id']
														
 
															+            update = {}
														
 
															+            update['status'] = status
														
 
															+            auth.update(update)
														
 
															+
														
 
															+        return True
														
 
															+
														
 
															+    def get(self, site, appid, file):
														
 
															+        extract = Demeter.model('extract')
														
 
															+        extract.site_id = site
														
 
															+        #extract.key = self.getKey(appid, file)
														
 
															+        extract.key = file
														
 
															+        data = extract.select(type='fetchone')
														
 
															+        return data
														
 
															+
														
 
															+    def getKey(self, appid, file):
														
 
															+        return Demeter.sha1(str(appid) + '_' + str(file))
														
 
															+
														
 
															+    def getFile(self, appid, file):
														
 
															+        info = {}
														
 
															+
														
 
															+        (filepath,temp) = os.path.split(file)
														
 
															+        (filename,extension) = os.path.splitext(temp)
														
 
															+
														
 
															+        info['source_file'] = file
														
 
															+        info['key'] = self.getKey(appid, file)
														
 
															+        info['ext'] = extension
														
 
															+        info['name'] = filename
														
 
															+
														
 
															+        info = self.getLocalFile(appid, file, info)
														
 
															+
														
 
															+        return info
														
 
															+
														
 
															+    def getLocalFile(self, appid, file, info):
														
 
															+
														
 
															+        day = str(date.today())
														
 
															+        day = day.split('-')
														
 
															+
														
 
															+        #filename =  Demeter.md5(str(uuid.uuid5(uuid.uuid1(), info['key'])))
														
 
															+        filename =  info['key']
														
 
															+        filepath = str(appid) + '/' + day[0] + '/' + day[1] + '/' + day[2]
														
 
															+        path = ''
														
 
															+
														
 
															+        if 'save' in Demeter.config['setting']:
														
 
															+            filepath = File.mkdirs(os.path.join(Demeter.config['setting']['save'], filepath)) + '/' + filename
														
 
															+        else:
														
 
															+            filepath = File.mkdirs(os.path.join(Demeter.path, 'runtime','files', filepath)) + '/' + filename
														
 
															+
														
 
															+        local = filepath + info['ext']
														
 
															+
														
 
															+        info['local_file'] = local
														
 
															+        info['local_path'] = filepath + '/'
														
 
															+
														
 
															+        return info
														
 
															+        if File.exists(local):
														
 
															+            return info
														
 
															+        else:
														
 
															+            self.download(file, local);
														
 
															+            return info
														
 
															+
														
 
															+    def download(self, file, local):
														
 
															+        if 'http' in file:
														
 
															+            import requests
														
 
															+            r = requests.get(file, stream=True)
														
 
															+            with open(local, 'wb') as up:
														
 
															+                for chunk in r.iter_content(chunk_size=1024):
														
 
															+                    if chunk:
														
 
															+                        up.write(chunk)
														
 
															+
														
 
															+        else:
														
 
															+            import shutil
														
 
															+            shutil.copyfile(file, local)
														
 
															+
														
 
															+        if File.exists(local):
														
 
															+            return True
														
 
															+        return False
														
 
															+
														
 
															+    def total(self, path):
														
 
															+        page = 0
														
 
															+        for parentdir,dirname,filenames in os.walk(path):  
														
 
															+            for filename in filenames:
														
 
															+                if os.path.splitext(filename)[1]=='.page':
														
 
															+                    page = page + 1
														
 
															+        return page
														
 
															+
														
 
															+    def handle(self, id):
														
 
															+        model = Demeter.model('extract')
														
 
															+        model.id = id
														
 
															+        info = model.select(type='fetchone')
														
 
															+
														
 
															+        if not info:
														
 
															+            return
														
 
															+        siteModel = Demeter.model('site')
														
 
															+        siteModel.id = info['site_id']
														
 
															+        site = siteModel.select(type='fetchone')
														
 
															+
														
 
															+        status = True
														
 
															+        if info['status'] == 1 or info['status'] == 4:
														
 
															+            status = False
														
 
															+
														
 
															+        if info and status == False:
														
 
															+            model.id = id
														
 
															+            update = {}
														
 
															+            update['status'] = 2
														
 
															+            model.update(update)
														
 
															+
														
 
															+            if not File.exists(info['local_file']):
														
 
															+                self.download(info['source_file'], info['local_file'])
														
 
															+
														
 
															+            if True:
														
 
															+                File.mkdir(info['local_path'])
														
 
															+
														
 
															+                Demeter.service(info['ext'], 'docs').load(info)
														
 
															+
														
 
															+
														
 
															+                if 'txt' in info['ext']:
														
 
															+                    import chardet
														
 
															+                    file_path = info['local_file']
														
 
															+                    with open(file_path, 'rb') as fp:
														
 
															+                        file_data = fp.read()
														
 
															+                        result = chardet.detect(file_data)
														
 
															+                        fp.close()
														
 
															+                        if result['encoding'] != 'utf-8':
														
 
															+                            file_content = file_data.decode(result['encoding'])
														
 
															+                            f = open(file_path, 'w')
														
 
															+                            f.write(file_content)
														
 
															+                            f.close()
														
 
															+                if 'pdf' in info['ext']:
														
 
															+
														
 
															+                handle = self.command(info)
														
 
															+                Shell.popen(handle)
														
 
															+                if File.exists(info['html']):
														
 
															+
														
 
															+                    # 处理图片
														
 
															+                    self.pic(info)
														
 
															+                    #self.string_switch(info['html'], "taste", "tasting")
														
 
															+                    # 获取有多少页
														
 
															+                    page = self.total(info['path'])
														
 
															+                    model.id = id
														
 
															+                    size = os.path.getsize(info['local'])
														
 
															+                    update = {}
														
 
															+                    update['file_size'] = size
														
 
															+                    update['page'] = page
														
 
															+                    update['status'] = 3
														
 
															+                    model.update(update)
														
 
															+
														
 
															+                    # 通知接口 通知应用成功转换
														
 
															+                    info['page'] = page
														
 
															+                    info['file_size'] = size
														
 
															+                    info['extract_status'] = 1
														
 
															+                    self.api(info, site)
														
 
															+                    return
														
 
															+
														
 
															+            model.id = id
														
 
															+            update = {}
														
 
															+            update['status'] = 4
														
 
															+            model.update(update)
														
 
															+            # 通知接口 通知应用失败转换
														
 
															+            info['page'] = 0
														
 
															+            info['file_size'] = 0
														
 
															+            info['extract_status'] = 2
														
 
															+            self.api(info, site)
														
 
															+
														
 
															+    def api(self, info, site):
														
 
															+        if 'file_id' in info and info['file_id']:
														
 
															+            api = site['api']
														
 
															+
														
 
															+            appid = site['appid']
														
 
															+            appsecret = site['appsecret']
														
 
															+            timestamp = Demeter.time()
														
 
															+            nonce = Demeter.hash()
														
 
															+            file = info['key']
														
 
															+            file_id = info['file_id']
														
 
															+            uid = info['uid']
														
 
															+
														
 
															+            param = self.signature(site['id'], appid, appsecret, timestamp, nonce, file, file_id, uid)
														
 
															+
														
 
															+            param['url'] = 'main/view'
														
 
															+            param['img'] = info['url'] + '.jpg'
														
 
															+            param['page'] = info['page']
														
 
															+            param['ext'] = info['ext']
														
 
															+            param['file_size'] = info['file_size']
														
 
															+            param['status'] = info['extract_status']
														
 
															+
														
 
															+            Demeter.curl(api, param, 'post')
														
 
															+
														
 
															+    def pic(self, info):
														
 
															+        from extract2jpg import extract2jpg
														
 
															+        from wand.image import Image
														
 
															+        width = 800
														
 
															+        # 对生成的图片进行缩放
														
 
															+        files = File.getFiles(info['path'])
														
 
															+        if files:
														
 
															+            for file in files:
														
 
															+                if 'jpg' in file or 'png' in file:
														
 
															+                    file = info['path'] + file
														
 
															+                    with Image(filename=file) as img:
														
 
															+                        target_width, target_height = self.getSize(width, img.width, img.height)
														
 
															+                        img.sample(target_width, target_height)
														
 
															+                        img.save(filename=file)
														
 
															+
														
 
															+        # 生成图片
														
 
															+        dest = info['html'] + '.photo'
														
 
															+        result = extract2jpg.extract_extract2jpg(info['extract'], dest, pages="0,1")
														
 
															+
														
 
															+        i = 0
														
 
															+        for j in result[0]['output_jpgfiles']:
														
 
															+            source = j
														
 
															+            if i == 0:
														
 
															+                dest = info['html'] + '.jpg'
														
 
															+            else:
														
 
															+                dest = info['html'] + '.jpg_' + str(i) + '.jpg'
														
 
															+            command = 'mv '+source+' ' + dest
														
 
															+            Shell.popen(command)
														
 
															+            
														
 
															+            with Image(filename=dest) as img:
														
 
															+                target_width, target_height = self.getSize(width, img.width, img.height)
														
 
															+                img.sample(target_width, target_height)
														
 
															+                img.save(filename=dest)
														
 
															+            i = i+1
														
 
															+
														
 
															+        '''
														
 
															+        from wand.image import Image
														
 
															+        extract = Image(filename=source, resolution=50)
														
 
															+        jpg = extract.extract('jpg')
														
 
															+        req_image = []
														
 
															+        i = 0
														
 
															+        for img in jpg.sequence:
														
 
															+            if i == 0:
														
 
															+                img_page = Image(image=img)
														
 
															+                req_image.append(img_page.make_blob('jpg'))
														
 
															+            i = i+1
														
 
															+
														
 
															+        for img in req_image:
														
 
															+            ff = open(dest, 'wb')
														
 
															+            ff.write(img)
														
 
															+            ff.close()
														
 
															+        '''
														
 
															+
														
 
															+
														
 
															+    def getSize(self, target_width, img_width, img_height):
														
 
															+        if img_width > target_width:
														
 
															+            ratio = target_width / img_width
														
 
															+            target_height = int(ratio * img_height)
														
 
															+        else:
														
 
															+            target_width = img_width
														
 
															+            target_height = img_height
														
 
															+        return target_width, target_height
														
 
															+
														
 
															+    def string_switch(self, x,y,z,s=1):
														
 
															+        with open(x, "r", encoding="utf-8") as f:
														
 
															+            #readlines以列表的形式将文件读出
														
 
															+            lines = f.readlines()
														
 
															+     
														
 
															+        with open(x, "w", encoding="utf-8") as f_w:
														
 
															+            #定义一个数字，用来记录在读取文件时在列表中的位置
														
 
															+            n = 0
														
 
															+            #默认选项，只替换第一次匹配到的行中的字符串
														
 
															+            if s == 1:
														
 
															+                for line in lines:
														
 
															+                    if y in line:
														
 
															+                        line = line.replace(y,z)
														
 
															+                        f_w.write(line)
														
 
															+                        n += 1
														
 
															+                        break
														
 
															+                    f_w.write(line)
														
 
															+                    n += 1
														
 
															+                #将剩余的文本内容继续输出
														
 
															+                for i in range(n,len(lines)):
														
 
															+                    f_w.write(lines[i])
														
 
															+            #全局匹配替换
														
 
															+            elif s == 'g':
														
 
															+                for line in lines:
														
 
															+                    if y in line:
														
 
															+                        line = line.replace(y,z)
														
 
															+                    f_w.write(line)
														
--- a/service/extract/loader.py
+++ b/service/extract/loader.py
@@ -0,0 +1,27 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from .__load__ import *
														
 
															+
														
 
															+class Loader(object):
														
 
															+    def get(self, file, param = {}):
														
 
															+        if 'http' in file:
														
 
															+            loader = 'web'
														
 
															+        elif File.exists(file):
														
 
															+            if '.csv' in file:
														
 
															+                loader = 'csv'
														
 
															+            elif '.pdf' in file:
														
 
															+                loader = 'pdf'
														
 
															+            elif '.html' in file:
														
 
															+                loader = 'html'
														
 
															+            elif '.json' in file:
														
 
															+                loader = 'json'
														
 
															+            elif '.xls' in file:
														
 
															+                loader = 'excel'
														
 
															+            elif '.ppt' in file:
														
 
															+                loader = 'ppt'
														
 
															+            elif '.doc' in file:
														
 
															+                loader = 'word'
														
 
															+            elif '.jpg' in file or '.png' in file or '.gif' in file or '.webp' in file:
														
 
															+                loader = 'img'
														
 
															+            else:
														
 
															+                loader = 'text'
														
 
															+        return Demeter.service(loader, 'extract.docs').init(file, param)
														
--- a/service/extract/parser.py
+++ b/service/extract/parser.py
@@ -0,0 +1,122 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from .__load__ import *
														
 
															+# 提取器
														
 
															+class Parser(object):
														
 
															+
														
 
															+    def get(self, id=0, site_id = 0, uid = 0, source_id = 0, source = '', notify='', sync=True, method='json'):
														
 
															+        extract = Demeter.model('extract')
														
 
															+        if int(id) > 0:
														
 
															+            extract.id = id
														
 
															+        else:
														
 
															+            extract.key = self.getKey(site_id, source)
														
 
															+        data = extract.select(type='fetchone')
														
 
															+        if not data:
														
 
															+            if not source:
														
 
															+                return source
														
 
															+            info = self.getFile(site_id, source)
														
 
															+            info['uid'] = uid
														
 
															+            info['source_id'] = source_id
														
 
															+            info['notify'] = notify
														
 
															+            info['status'] = 1
														
 
															+            info['id'] = Demeter.service('common').update('extract', False, info)
														
 
															+        else:
														
 
															+            info = data
														
 
															+        if sync:
														
 
															+            return self.handle(info, method);
														
 
															+        return info['id']
														
 
															+
														
 
															+    def getFile(self, site_id, file):
														
 
															+        info = {}
														
 
															+        (filepath,temp) = os.path.split(file)
														
 
															+        (filename,extension) = os.path.splitext(temp)
														
 
															+        info['site_id'] = site_id;
														
 
															+        info['source'] = file
														
 
															+        info['key'] = self.getKey(site_id, file)
														
 
															+        info['ext'] = extension
														
 
															+        info['name'] = filename
														
 
															+        info['file'] = file
														
 
															+        info['path'] = filepath
														
 
															+        info = self.getLocal(info)
														
 
															+        info['size'] = os.path.getsize(info['file'])
														
 
															+        return info
														
 
															+
														
 
															+    def getKey(self, site_id, file):
														
 
															+        return Demeter.md5(str(site_id) + '_' + str(file))
														
 
															+
														
 
															+    def getLocal(self, info):
														
 
															+        if 'http' in info['source']:
														
 
															+            day = str(date.today())
														
 
															+            day = day.split('-')
														
 
															+            filename =  info['key']
														
 
															+            filepath = str(info['site_id']) + '/' + day[0] + '/' + day[1] + '/' + day[2]
														
 
															+        else:
														
 
															+            filename = info['name']
														
 
															+            filepath = info['path']
														
 
															+
														
 
															+        if 'save' in Demeter.config['setting']:
														
 
															+            filepath = File.mkdirs(os.path.join(Demeter.config['setting']['save'], filepath)) + '/' + filename
														
 
															+        else:
														
 
															+            filepath = File.mkdirs(os.path.join(Demeter.path, 'runtime','files', filepath)) + '/' + filename
														
 
															+
														
 
															+        info['file'] = filepath + info['ext']
														
 
															+        info['path'] = filepath + '/'
														
 
															+        if File.exists(info['file']):
														
 
															+            return info
														
 
															+        else:
														
 
															+            self.download(info['source'], info['file']);
														
 
															+            return info
														
 
															+
														
 
															+    def download(self, file, local):
														
 
															+        if 'http' in file:
														
 
															+            import requests
														
 
															+            r = requests.get(file, stream=True)
														
 
															+            with open(local, 'wb') as up:
														
 
															+                for chunk in r.iter_content(chunk_size=1024):
														
 
															+                    if chunk:
														
 
															+                        up.write(chunk)
														
 
															+        else:
														
 
															+            import shutil
														
 
															+            shutil.copyfile(file, local)
														
 
															+
														
 
															+        if File.exists(local):
														
 
															+            return True
														
 
															+        return False
														
 
															+
														
 
															+    def handle(self, info, method):
														
 
															+        param = {}
														
 
															+        param['method'] = 'extract'
														
 
															+        param['page'] = 0
														
 
															+        param['status'] = 4
														
 
															+        param['source_id'] = info['source_id']
														
 
															+        status = True
														
 
															+        if info['status'] == 1 or info['status'] == 4:
														
 
															+            status = False
														
 
															+
														
 
															+        #if info and status == False:
														
 
															+        if info:
														
 
															+            Demeter.service('common').update('extract', info['id'], {'status':2})
														
 
															+
														
 
															+            if not File.exists(info['file']):
														
 
															+                self.download(info['source'], info['file'])
														
 
															+            if True:
														
 
															+                File.mkdir(info['path'])
														
 
															+                obj = Demeter.service('loader', 'extract').get(info['file'], {'path':info['path']})
														
 
															+                func = getattr(obj, method)
														
 
															+                result = func()
														
 
															+                if result and 'page' in result and result['page'] > 0:
														
 
															+                    param['content'] = result['content']
														
 
															+                    param['page'] = result['page']
														
 
															+                    param['status'] = 3
														
 
															+                    if method == 'json':
														
 
															+                        method = 1
														
 
															+                    else:
														
 
															+                        method = 2
														
 
															+                    data = {'extract_id': info['id'], 'method' : method}
														
 
															+                    content = Demeter.service('common').one('extract_content', **data)
														
 
															+                    if not content:
														
 
															+                        result = json.dumps(result, ensure_ascii=False)
														
 
															+                        data['content'] = result
														
 
															+                        Demeter.service('common').update('extract_content', False, data)
														
 
															+            Demeter.service('common').update('extract', info['id'], {'status':param['status'], 'page':param['page']})
														
 
															+            Demeter.service('callback').send(info['site_id'], param)
														
 
															+            return param
														
--- a/service/linker/__init__.py
+++ b/service/linker/__init__.py
@@ -0,0 +1 @@
 
															+# -*- coding: utf-8 -*-
														
--- a/service/linker/__load__.py
+++ b/service/linker/__load__.py
@@ -0,0 +1,3 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from demeter.core import *
														
 
															+import os
														
--- a/service/linker/ali.py
+++ b/service/linker/ali.py
@@ -0,0 +1,12 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from .__load__ import *
														
 
															+from langchain_community.chat_models.tongyi import ChatTongyi
														
 
															+
														
 
															+class Ali(object):
														
 
															+
														
 
															+    def load(self, model = 'qwen-plus-latest', streaming = True):
														
 
															+        return ChatTongyi(
														
 
															+            model=model,
														
 
															+            api_key=Demeter.config['ali']['api_key'],
														
 
															+            streaming=streaming,
														
 
															+        )
														
--- a/service/linker/baidu.py
+++ b/service/linker/baidu.py
@@ -0,0 +1,13 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from .__load__ import *
														
 
															+from langchain_community.chat_models import QianfanChatEndpoint
														
 
															+
														
 
															+class Baidu(object):
														
 
															+
														
 
															+    def load(self, model = 'ERNIE-Bot-turbo', streaming = True):
														
 
															+        for key,value in Demeter.config['baidu'].items():
														
 
															+            os.environ[key.upper()] = value
														
 
															+        return QianfanChatEndpoint(
														
 
															+            streaming=streaming,
														
 
															+            model=model,
														
 
															+        )
														
--- a/service/linker/deepseek.py
+++ b/service/linker/deepseek.py
@@ -0,0 +1,13 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from .__load__ import *
														
 
															+from langchain.chat_models import ChatOpenAI
														
 
															+
														
 
															+class Deepseek(object):
														
 
															+
														
 
															+    def load(self, model = '', streaming = True):
														
 
															+        return ChatOpenAI(
														
 
															+            model_name=model,
														
 
															+            openai_api_key=Demeter.config['dp']['api_key'],
														
 
															+            openai_api_base="https://api.deepseek.com",
														
 
															+            streaming=streaming,
														
 
															+        )
														
--- a/service/linker/moonshot.py
+++ b/service/linker/moonshot.py
@@ -0,0 +1,12 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from .__load__ import *
														
 
															+from langchain_community.chat_models import MoonshotChat
														
 
															+
														
 
															+class Moonshot(object):
														
 
															+
														
 
															+    def load(self, model = 'moonshot-v1-32k', streaming = True):
														
 
															+        return MoonshotChat(
														
 
															+            model=model,
														
 
															+            moonshot_api_key=Demeter.config['moonshot']['api_key'],
														
 
															+            streaming=streaming,
														
 
															+        )
														
--- a/service/linker/spark.py
+++ b/service/linker/spark.py
@@ -0,0 +1,15 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from .__load__ import *
														
 
															+from langchain_community.chat_models import SparkLLM
														
 
															+
														
 
															+class Spark(object):
														
 
															+
														
 
															+    def load(self, model = 'qwen-turbo', streaming = True):
														
 
															+        return SparkLLM(  # 科大讯飞星火（豆包）适配
														
 
															+            app_id=Demeter.config['spark']['app_id'],
														
 
															+            api_key=Demeter.config['spark']['api_key'],
														
 
															+            api_secret=Demeter.config['spark']['api_secret'],
														
 
															+            domain=Demeter.config['spark']['domain'],
														
 
															+            spark_url=Demeter.config['spark']['spark_url'],
														
 
															+            streaming=streaming,
														
 
															+        )
														
--- a/service/linker/zhipu.py
+++ b/service/linker/zhipu.py
@@ -0,0 +1,12 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from .__load__ import *
														
 
															+from langchain.chat_models import ChatOpenAI
														
 
															+
														
 
															+class Zhipu(object):
														
 
															+
														
 
															+    def load(self, model = 'glm-4', streaming = True):
														
 
															+        return ZhipuAI(
														
 
															+            model=model,
														
 
															+            api_key=Demeter.config['zhipu']['api_key'],
														
 
															+            streaming=streaming,
														
 
															+        )
														
--- a/service/loader.py
+++ b/service/loader.py
@@ -0,0 +1,47 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from .__load__ import *
														
 
															+from gevent import monkey; monkey.patch_socket()
														
 
															+import gevent
														
 
															+class Loader(object):
														
 
															+
														
 
															+    # 获取
														
 
															+    def get(self, obj='', module='', **param):
														
 
															+        if 'sync' in param and param['sync']:
														
 
															+            return Demeter.service(obj, module).get(**param)
														
 
															+        else:
														
 
															+            param['sync'] = False
														
 
															+            id = Demeter.service(obj, module).get(**param)
														
 
															+            redis = Demeter.redis()
														
 
															+            config = Demeter.config['redis']
														
 
															+            content = obj + '|' + module + '|' + str(id) 
														
 
															+            redis.rpush(config['name'], content)
														
 
															+            return content
														
 
															+
														
 
															+    # 启动任务
														
 
															+    def start(self):
														
 
															+        gevent.joinall([
														
 
															+            gevent.spawn(self.run),
														
 
															+        ])
														
 
															+
														
 
															+    # 定时运行异步任务
														
 
															+    def run(self):
														
 
															+        timeSleep = 1
														
 
															+        redis = Demeter.redis()
														
 
															+        config = Demeter.config['redis']
														
 
															+        i = 0
														
 
															+        while 1:
														
 
															+            content = redis.lpop(config['name'])
														
 
															+            if content:
														
 
															+                print(content)
														
 
															+                command = self.command(content.decode('utf-8'))
														
 
															+                Shell.popen(command, False, False)
														
 
															+            i = i+1
														
 
															+            if i >= 10:
														
 
															+                gevent.sleep(timeSleep)
														
 
															+                i = 0
														
 
															+
														
 
															+    def command(self, content):
														
 
															+        temp = content.split('|')
														
 
															+        python_path = sys.executable
														
 
															+        loader_path = os.path.join(File.path(), 'loader.py')  # 生成系统规范路径
														
 
															+        return f'"{python_path}" "{loader_path}" -o {temp[0]} -m {temp[1]} -i {temp[2]}'
														
--- a/service/spliter/__init__.py
+++ b/service/spliter/__init__.py
@@ -0,0 +1 @@
 
															+# -*- coding: utf-8 -*-
	`@@ -0,0 +1,2 @@`
			`+# -- coding: utf-8 --`
			`+from demeter.admin.page.__load__ import *`
	`@@ -0,0 +1 @@`
			`+[["id", 1], ["extract_id", 1], ["method", 1], ["content", 1], ["state", 1], ["cdate", 1]]`
	`@@ -0,0 +1 @@`
			`+[["id", 1], ["name", 1], ["link", 1], ["appid", 1], ["appsecret", 1], ["sdate", 1], ["edate", 1], ["api", 1], ["state", 1], ["cdate", 1]]`