routes.py 32 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950
  1. from flask import request, jsonify, send_file, current_app
  2. from app.api.meta_data import bp
  3. from app.models.result import success, failed
  4. import logging
  5. import io
  6. from minio import Minio
  7. from minio.error import S3Error
  8. from app.services.neo4j_driver import neo4j_driver
  9. from app.core.meta_data import (
  10. get_formatted_time,
  11. meta_list,
  12. meta_kinship_graph,
  13. parse_text,
  14. handle_txt_graph,
  15. get_file_content,
  16. text_resource_solve,
  17. handle_id_unstructured,
  18. solve_unstructured_data
  19. )
  20. from app.core.system.auth import require_auth
  21. logger = logging.getLogger("app")
  22. def get_minio_client():
  23. """获取 MinIO 客户端实例"""
  24. return Minio(
  25. current_app.config['MINIO_HOST'],
  26. access_key=current_app.config['MINIO_USER'],
  27. secret_key=current_app.config['MINIO_PASSWORD'],
  28. secure=current_app.config['MINIO_SECURE']
  29. )
  30. def get_minio_config():
  31. """获取 MinIO 配置"""
  32. return {
  33. 'MINIO_BUCKET': current_app.config['MINIO_BUCKET'],
  34. 'PREFIX': current_app.config['PREFIX'],
  35. 'ALLOWED_EXTENSIONS': current_app.config['ALLOWED_EXTENSIONS']
  36. }
  37. def allowed_file(filename):
  38. """检查文件扩展名是否允许"""
  39. if '.' not in filename:
  40. return False
  41. ext = filename.rsplit('.', 1)[1].lower()
  42. return ext in get_minio_config()['ALLOWED_EXTENSIONS']
  43. # 元数据列表
  44. @bp.route('/node/list', methods=['POST'])
  45. def meta_node_list():
  46. try:
  47. if not request.json:
  48. return jsonify(failed("请求数据不能为空"))
  49. # 从请求中获取分页参数
  50. page = int(request.json.get('current', 1))
  51. page_size = int(request.json.get('size', 10))
  52. # 获取搜索参数
  53. search = request.json.get('search', '')
  54. name_en_filter = request.json.get('name_en', None)
  55. name_zh_filter = request.json.get('name_zh', None)
  56. category_filter = request.json.get('category', None)
  57. time_filter = request.json.get('time', None)
  58. tag_filter = request.json.get('tag', None)
  59. # 调用核心业务逻辑
  60. result, total_count = meta_list(
  61. page,
  62. page_size,
  63. search,
  64. name_en_filter,
  65. name_zh_filter,
  66. category_filter,
  67. time_filter,
  68. tag_filter
  69. )
  70. # 返回结果
  71. return jsonify(success({
  72. "records": result,
  73. "total": total_count,
  74. "size": page_size,
  75. "current": page
  76. }))
  77. except Exception as e:
  78. logger.error(f"获取元数据列表失败: {str(e)}")
  79. return jsonify(failed(str(e)))
  80. # 元数据图谱
  81. @bp.route('/node/graph', methods=['POST'])
  82. def meta_node_graph():
  83. try:
  84. if not request.json:
  85. return jsonify(failed("请求数据不能为空"))
  86. # 从请求中获取节点ID
  87. node_id = request.json.get('nodeId')
  88. # 调用核心业务逻辑
  89. result = meta_kinship_graph(node_id)
  90. # 返回结果
  91. return jsonify(success(result))
  92. except Exception as e:
  93. logger.error(f"获取元数据图谱失败: {str(e)}")
  94. return jsonify(failed(str(e)))
  95. # 删除元数据
  96. @bp.route('/node/delete', methods=['POST'])
  97. def meta_node_delete():
  98. try:
  99. if not request.json:
  100. return jsonify(failed("请求数据不能为空"))
  101. # 从请求中获取节点ID
  102. node_id = request.json.get('id')
  103. # 删除节点逻辑
  104. with neo4j_driver.get_session() as session:
  105. cypher = "MATCH (n) WHERE id(n) = $node_id DETACH DELETE n"
  106. session.run(cypher, node_id=int(node_id))
  107. # 返回结果
  108. return jsonify(success({}))
  109. except Exception as e:
  110. logger.error(f"删除元数据失败: {str(e)}")
  111. return jsonify(failed(str(e)))
  112. # 编辑元数据
  113. @bp.route('/node/edit', methods=['POST'])
  114. def meta_node_edit():
  115. try:
  116. if not request.json:
  117. return jsonify(failed("请求数据不能为空"))
  118. # 从请求中获取节点ID
  119. node_id = request.json.get('id')
  120. if not node_id:
  121. return jsonify(failed("节点ID不能为空"))
  122. # 获取节点
  123. with neo4j_driver.get_session() as session:
  124. # 查询节点信息
  125. cypher = """
  126. MATCH (n:DataMeta)
  127. WHERE id(n) = $node_id
  128. RETURN n
  129. """
  130. result = session.run(cypher, node_id=int(node_id))
  131. node = result.single()
  132. if not node or not node["n"]:
  133. return jsonify(failed("节点不存在"))
  134. # 获取节点数据
  135. node_data = dict(node["n"])
  136. node_data["id"] = node["n"].id
  137. # 获取标签信息
  138. tag_cypher = """
  139. MATCH (n:DataMeta)-[:LABEL]->(t:DataLabel)
  140. WHERE id(n) = $node_id
  141. RETURN t
  142. """
  143. tag_result = session.run(tag_cypher, node_id=int(node_id))
  144. tag = tag_result.single()
  145. # 获取主数据信息
  146. master_data_cypher = """
  147. MATCH (n:DataMeta)-[:master_data]->(m:master_data)
  148. WHERE id(n) = $node_id
  149. RETURN m
  150. """
  151. master_data_result = session.run(
  152. master_data_cypher, node_id=int(node_id)
  153. )
  154. master_data = master_data_result.single()
  155. # 构建返回数据
  156. response_data = [{
  157. "master_data": (
  158. master_data["m"].id
  159. if master_data and master_data["m"] else None
  160. ),
  161. "name_zh": node_data.get("name_zh", ""),
  162. "name_en": node_data.get("name_en", ""),
  163. "create_time": node_data.get("create_time", ""),
  164. "update_time": node_data.get("update_time", ""),
  165. "status": bool(node_data.get("status", True)),
  166. "data_type": node_data.get("data_type", ""),
  167. "tag": {
  168. "name_zh": (
  169. tag["t"].get("name_zh", "")
  170. if tag and tag["t"] else None
  171. ),
  172. "name_en": (
  173. tag["t"].get("name_en", "")
  174. if tag and tag["t"] else None
  175. ),
  176. "id": tag["t"].id if tag and tag["t"] else None
  177. },
  178. "affiliation": node_data.get("affiliation"),
  179. "category": node_data.get("category"),
  180. "alias": node_data.get("alias"),
  181. "describe": node_data.get("describe")
  182. }]
  183. logger.info(f"成功获取元数据节点: ID={node_data['id']}")
  184. return jsonify(success(response_data))
  185. except Exception as e:
  186. logger.error(f"获取元数据节点失败: {str(e)}")
  187. return jsonify(failed(str(e)))
  188. # 增加元数据
  189. @bp.route('/check', methods=['GET'])
  190. def meta_check():
  191. """
  192. 检查元数据中文名是否已存在
  193. 请求参数:
  194. - name_zh: 元数据中文名(URL参数)
  195. 返回:
  196. - exists: true/false 表示是否存在
  197. """
  198. try:
  199. name_zh = request.args.get('name_zh')
  200. if not name_zh:
  201. return jsonify(failed("缺少name_zh参数"))
  202. # 查询数据库检查是否存在
  203. with neo4j_driver.get_session() as session:
  204. cypher = """
  205. MATCH (n:DataMeta {name_zh: $name_zh})
  206. RETURN count(n) > 0 as exists
  207. """
  208. result = session.run(cypher, name_zh=name_zh)
  209. record = result.single()
  210. if record:
  211. exists = record["exists"]
  212. logger.info(f"检查元数据 '{name_zh}': {'存在' if exists else '不存在'}")
  213. return jsonify(success({
  214. "exists": exists,
  215. "name_zh": name_zh
  216. }, "查询成功"))
  217. else:
  218. return jsonify(success({
  219. "exists": False,
  220. "name_zh": name_zh
  221. }, "查询成功"))
  222. except Exception as e:
  223. logger.error(f"检查元数据失败: {str(e)}")
  224. return jsonify(failed(f"检查失败: {str(e)}"))
  225. @bp.route('/node/add', methods=['POST'])
  226. def meta_node_add():
  227. try:
  228. if not request.json:
  229. return jsonify(failed("请求数据不能为空"))
  230. # 从请求中获取节点信息
  231. node_name_zh = request.json.get('name_zh')
  232. node_type = request.json.get('data_type')
  233. node_category = request.json.get('category')
  234. node_alias = request.json.get('alias')
  235. node_affiliation = request.json.get('affiliation')
  236. node_tag = request.json.get('tag')
  237. node_desc = request.json.get('describe')
  238. node_status = bool(request.json.get('status', True))
  239. node_name_en = request.json.get('name_en')
  240. if not node_name_zh:
  241. return jsonify(failed("节点名称不能为空"))
  242. if not node_type:
  243. return jsonify(failed("节点类型不能为空"))
  244. # 创建节点
  245. with neo4j_driver.get_session() as session:
  246. cypher = """
  247. MERGE (n:DataMeta {name_zh: $name_zh})
  248. ON CREATE SET n.name_en = $name_en,
  249. n.data_type = $data_type,
  250. n.category = $category,
  251. n.alias = $alias,
  252. n.affiliation = $affiliation,
  253. n.describe = $describe,
  254. n.create_time = $create_time,
  255. n.updateTime = $update_time,
  256. n.status = $status,
  257. n.name_en = $name_en
  258. ON MATCH SET n.data_type = $data_type,
  259. n.category = $category,
  260. n.alias = $alias,
  261. n.affiliation = $affiliation,
  262. n.describe = $describe,
  263. n.updateTime = $update_time,
  264. n.status = $status,
  265. n.name_en = $name_en
  266. RETURN n
  267. """
  268. create_time = update_time = get_formatted_time()
  269. result = session.run(
  270. cypher,
  271. name_zh=node_name_zh,
  272. data_type=node_type,
  273. category=node_category,
  274. alias=node_alias,
  275. affiliation=node_affiliation,
  276. describe=node_desc,
  277. create_time=create_time,
  278. update_time=update_time,
  279. status=node_status,
  280. name_en=node_name_en
  281. )
  282. node = result.single()
  283. if node and node["n"]:
  284. node_data = dict(node["n"])
  285. node_data["id"] = node["n"].id
  286. # 如果提供了标签ID,创建标签关系
  287. if node_tag:
  288. tag_cypher = """
  289. MATCH (n:DataMeta), (t:DataLabel)
  290. WHERE id(n) = $node_id AND id(t) = $tag_id
  291. MERGE (n)-[r:LABEL]->(t)
  292. RETURN r
  293. """
  294. session.run(
  295. tag_cypher,
  296. node_id=node["n"].id,
  297. tag_id=int(node_tag)
  298. )
  299. logger.info(
  300. f"成功创建或更新元数据节点: "
  301. f"ID={node_data['id']}, name={node_name_zh}"
  302. )
  303. return jsonify(success(node_data))
  304. else:
  305. logger.error(f"创建元数据节点失败: {node_name_zh}")
  306. return jsonify(failed("创建元数据节点失败"))
  307. except Exception as e:
  308. logger.error(f"添加元数据失败: {str(e)}")
  309. return jsonify(failed(str(e)))
  310. # 搜索元数据
  311. @bp.route('/search', methods=['GET'])
  312. def search_metadata_route():
  313. try:
  314. keyword = request.args.get('keyword', '')
  315. if not keyword:
  316. return jsonify(success([]))
  317. cypher = """
  318. MATCH (n:DataMeta)
  319. WHERE n.name_zh CONTAINS $keyword
  320. RETURN n LIMIT 100
  321. """
  322. with neo4j_driver.get_session() as session:
  323. result = session.run(cypher, keyword=keyword)
  324. metadata_list = [dict(record["n"]) for record in result]
  325. return jsonify(success(metadata_list))
  326. except Exception as e:
  327. logger.error(f"搜索元数据失败: {str(e)}")
  328. return jsonify(failed(str(e)))
  329. # 全文检索查询
  330. @bp.route('/full/text/query', methods=['POST'])
  331. def full_text_query():
  332. try:
  333. if not request.json:
  334. return jsonify(failed("请求数据不能为空"))
  335. # 获取查询条件
  336. search_term = request.json.get('query', '')
  337. if not search_term:
  338. return jsonify(failed("查询条件不能为空"))
  339. # 执行Neo4j全文索引查询
  340. with neo4j_driver.get_session() as session:
  341. cypher = """
  342. CALL db.index.fulltext.queryNodes("DataMetaFulltext", $term)
  343. YIELD node, score
  344. RETURN node, score
  345. ORDER BY score DESC
  346. LIMIT 20
  347. """
  348. result = session.run(cypher, term=search_term)
  349. # 处理查询结果
  350. search_results = []
  351. for record in result:
  352. node_data = dict(record["node"])
  353. node_data["id"] = record["node"].id
  354. node_data["score"] = record["score"]
  355. search_results.append(node_data)
  356. return jsonify(success(search_results))
  357. except Exception as e:
  358. logger.error(f"全文检索查询失败: {str(e)}")
  359. return jsonify(failed(str(e)))
  360. # 非结构化文本查询
  361. @bp.route('/unstructure/text/query', methods=['POST'])
  362. def unstructure_text_query():
  363. try:
  364. if not request.json:
  365. return jsonify(failed("请求数据不能为空"))
  366. # 获取查询参数
  367. node_id = request.json.get('id')
  368. if not node_id:
  369. return jsonify(failed("节点ID不能为空"))
  370. # 获取节点信息
  371. node_data = handle_id_unstructured(node_id)
  372. if not node_data:
  373. return jsonify(failed("节点不存在"))
  374. # 获取对象路径
  375. object_name = node_data.get('url')
  376. if not object_name:
  377. return jsonify(failed("文档路径不存在"))
  378. # 获取 MinIO 配置
  379. minio_client = get_minio_client()
  380. config = get_minio_config()
  381. bucket_name = config['MINIO_BUCKET']
  382. # 从MinIO获取文件内容
  383. file_content = get_file_content(minio_client, bucket_name, object_name)
  384. # 解析文本内容
  385. parsed_data = parse_text(file_content)
  386. # 返回结果
  387. result = {
  388. "node": node_data,
  389. "parsed": parsed_data,
  390. "content": (
  391. file_content[:1000] + "..."
  392. if len(file_content) > 1000 else file_content
  393. )
  394. }
  395. return jsonify(success(result))
  396. except Exception as e:
  397. logger.error(f"非结构化文本查询失败: {str(e)}")
  398. return jsonify(failed(str(e)))
  399. # 文件上传
  400. @bp.route('/resource/upload', methods=['POST'])
  401. def upload_file():
  402. try:
  403. # 检查请求中是否有文件
  404. if 'file' not in request.files:
  405. return jsonify(failed("没有找到上传的文件"))
  406. file = request.files['file']
  407. # 检查文件名
  408. if not file.filename:
  409. return jsonify(failed("未选择文件"))
  410. # 保存文件名到本地变量(确保类型安全)
  411. filename = file.filename
  412. # 检查文件类型
  413. if not allowed_file(filename):
  414. return jsonify(failed("不支持的文件类型"))
  415. # 获取 MinIO 配置
  416. minio_client = get_minio_client()
  417. config = get_minio_config()
  418. # 上传到MinIO
  419. file_content = file.read()
  420. file_size = len(file_content)
  421. file_type = filename.rsplit('.', 1)[1].lower()
  422. # 提取文件名(不包含扩展名)
  423. filename_without_ext = filename.rsplit('.', 1)[0]
  424. # 生成紧凑的时间戳 (yyyyMMddHHmmss)
  425. import time
  426. timestamp = time.strftime("%Y%m%d%H%M%S", time.localtime())
  427. # 生成唯一文件名
  428. object_name = (
  429. f"{config['PREFIX']}/"
  430. f"{filename_without_ext}_{timestamp}.{file_type}"
  431. )
  432. # 上传文件
  433. minio_client.put_object(
  434. config['MINIO_BUCKET'],
  435. object_name,
  436. io.BytesIO(file_content),
  437. file_size,
  438. content_type=f"application/{file_type}"
  439. )
  440. # 返回结果
  441. return jsonify(success({
  442. "filename": file.filename,
  443. "size": file_size,
  444. "type": file_type,
  445. "url": object_name
  446. }))
  447. except Exception as e:
  448. logger.error(f"文件上传失败: {str(e)}")
  449. return jsonify(failed(str(e)))
  450. # 文件下载显示
  451. @bp.route('/resource/display', methods=['POST'])
  452. def upload_file_display():
  453. response = None
  454. try:
  455. if not request.json:
  456. return jsonify(failed("请求数据不能为空"))
  457. object_name = request.json.get('url')
  458. if not object_name:
  459. return jsonify(failed("文件路径不能为空"))
  460. # 获取 MinIO 配置
  461. minio_client = get_minio_client()
  462. config = get_minio_config()
  463. # 获取文件内容
  464. response = minio_client.get_object(config['MINIO_BUCKET'], object_name)
  465. file_data = response.read()
  466. # 获取文件名
  467. file_name = object_name.split('/')[-1]
  468. # 确定文件类型
  469. file_extension = file_name.split('.')[-1].lower()
  470. # 为不同文件类型设置合适的MIME类型
  471. mime_types = {
  472. 'pdf': 'application/pdf',
  473. 'doc': 'application/msword',
  474. 'docx': (
  475. 'application/vnd.openxmlformats-'
  476. 'officedocument.wordprocessingml.document'
  477. ),
  478. 'xls': 'application/vnd.ms-excel',
  479. 'xlsx': (
  480. 'application/vnd.openxmlformats-'
  481. 'officedocument.spreadsheetml.sheet'
  482. ),
  483. 'txt': 'text/plain',
  484. 'csv': 'text/csv'
  485. }
  486. content_type = mime_types.get(
  487. file_extension, 'application/octet-stream'
  488. )
  489. # 返回结果
  490. return jsonify(success({
  491. "filename": file_name,
  492. "type": file_extension,
  493. "contentType": content_type,
  494. "size": len(file_data),
  495. "url": f"/api/meta/resource/download?url={object_name}"
  496. }))
  497. except S3Error as e:
  498. logger.error(f"MinIO操作失败: {str(e)}")
  499. return jsonify(failed(f"文件访问失败: {str(e)}"))
  500. except Exception as e:
  501. logger.error(f"文件显示信息获取失败: {str(e)}")
  502. return jsonify(failed(str(e)))
  503. finally:
  504. if response:
  505. response.close()
  506. response.release_conn()
  507. # 文件下载接口
  508. @bp.route('/resource/download', methods=['GET'])
  509. def download_file():
  510. response = None
  511. try:
  512. object_name = request.args.get('url')
  513. if not object_name:
  514. return jsonify(failed("文件路径不能为空"))
  515. # URL解码,处理特殊字符
  516. import urllib.parse
  517. object_name = urllib.parse.unquote(object_name)
  518. # 记录下载请求信息,便于调试
  519. logger.info(f"下载文件请求: {object_name}")
  520. # 获取 MinIO 配置
  521. minio_client = get_minio_client()
  522. config = get_minio_config()
  523. # 获取文件
  524. try:
  525. response = minio_client.get_object(
  526. config['MINIO_BUCKET'], object_name
  527. )
  528. file_data = response.read()
  529. except S3Error as e:
  530. logger.error(f"MinIO获取文件失败: {str(e)}")
  531. return jsonify(failed(f"文件获取失败: {str(e)}"))
  532. # 获取文件名,并处理特殊字符
  533. file_name = object_name.split('/')[-1]
  534. # 直接从内存返回文件,不创建临时文件
  535. file_stream = io.BytesIO(file_data)
  536. # 返回文件
  537. return send_file(
  538. file_stream,
  539. as_attachment=True,
  540. download_name=file_name,
  541. mimetype="application/octet-stream"
  542. )
  543. except Exception as e:
  544. logger.error(f"文件下载失败: {str(e)}")
  545. return jsonify(failed(str(e)))
  546. finally:
  547. if response:
  548. response.close()
  549. response.release_conn()
  550. # 文本资源翻译
  551. @bp.route('/resource/translate', methods=['POST'])
  552. def text_resource_translate():
  553. try:
  554. if not request.json:
  555. return jsonify(failed("请求数据不能为空"))
  556. # 获取参数
  557. name_zh = request.json.get('name_zh', '')
  558. keyword = request.json.get('keyword', '')
  559. if not name_zh:
  560. return jsonify(failed("名称不能为空"))
  561. # 调用资源处理逻辑
  562. result = text_resource_solve(None, name_zh, keyword)
  563. return jsonify(success(result))
  564. except Exception as e:
  565. logger.error(f"文本资源翻译失败: {str(e)}")
  566. return jsonify(failed(str(e)))
  567. # 创建文本资源节点
  568. @bp.route('/resource/node', methods=['POST'])
  569. def text_resource_node():
  570. try:
  571. if not request.json:
  572. return jsonify(failed("请求数据不能为空"))
  573. # 获取参数
  574. name_zh = request.json.get('name_zh', '')
  575. name_en = request.json.get('name_en', '')
  576. keywords = request.json.get('keywords', [])
  577. keywords_en = request.json.get('keywords_en', [])
  578. object_name = request.json.get('url', '')
  579. if not name_zh or not name_en or not object_name:
  580. return jsonify(failed("参数不完整"))
  581. # 创建节点
  582. with neo4j_driver.get_session() as session:
  583. # 创建资源节点
  584. cypher = """
  585. CREATE (n:DataMeta {
  586. name_zh: $name_zh,
  587. name_en: $name_en,
  588. keywords: $keywords,
  589. keywords_en: $keywords_en,
  590. url: $object_name,
  591. create_time: $create_time,
  592. updateTime: $update_time
  593. })
  594. RETURN n
  595. """
  596. create_time = update_time = get_formatted_time()
  597. result = session.run(
  598. cypher,
  599. name_zh=name_zh,
  600. name_en=name_en,
  601. keywords=keywords,
  602. keywords_en=keywords_en,
  603. object_name=object_name,
  604. create_time=create_time,
  605. update_time=update_time
  606. )
  607. record = result.single()
  608. if not record:
  609. return jsonify(failed("创建节点失败"))
  610. node = record["n"]
  611. # 为每个关键词创建标签节点并关联
  612. for i, keyword in enumerate(keywords):
  613. if keyword:
  614. # 创建标签节点
  615. tag_cypher = """
  616. MERGE (t:Tag {name_zh: $name_zh})
  617. ON CREATE SET t.name_en = $name_en,
  618. t.create_time = $create_time
  619. RETURN t
  620. """
  621. tag_result = session.run(
  622. tag_cypher,
  623. name_zh=keyword,
  624. name_en=keywords_en[i] if i < len(keywords_en) else "",
  625. create_time=create_time
  626. )
  627. tag_record = tag_result.single()
  628. if not tag_record:
  629. continue
  630. tag_node = tag_record["t"]
  631. # 创建关系
  632. rel_cypher = """
  633. MATCH (n), (t)
  634. WHERE id(n) = $node_id AND id(t) = $tag_id
  635. CREATE (n)-[r:HAS_TAG]->(t)
  636. RETURN r
  637. """
  638. session.run(
  639. rel_cypher,
  640. node_id=node.id,
  641. tag_id=tag_node.id
  642. )
  643. # 返回创建的节点
  644. return jsonify(success(dict(node)))
  645. except Exception as e:
  646. logger.error(f"创建文本资源节点失败: {str(e)}")
  647. return jsonify(failed(str(e)))
  648. # 处理非结构化数据
  649. @bp.route('/unstructured/process', methods=['POST'])
  650. def processing_unstructured_data():
  651. try:
  652. if not request.json:
  653. return jsonify(failed("请求数据不能为空"))
  654. # 获取参数
  655. node_id = request.json.get('id')
  656. if not node_id:
  657. return jsonify(failed("节点ID不能为空"))
  658. # 获取 MinIO 配置
  659. minio_client = get_minio_client()
  660. config = get_minio_config()
  661. prefix = config['PREFIX']
  662. # 调用处理逻辑
  663. result = solve_unstructured_data(node_id, minio_client, prefix)
  664. if result:
  665. return jsonify(success({"message": "处理成功"}))
  666. else:
  667. return jsonify(failed("处理失败"))
  668. except Exception as e:
  669. logger.error(f"处理非结构化数据失败: {str(e)}")
  670. return jsonify(failed(str(e)))
  671. # 创建文本图谱
  672. @bp.route('/text/graph', methods=['POST'])
  673. def create_text_graph():
  674. try:
  675. if not request.json:
  676. return jsonify(failed("请求数据不能为空"))
  677. # 获取参数
  678. node_id = request.json.get('id')
  679. entity_zh = request.json.get('entity_zh')
  680. entity_en = request.json.get('entity_en')
  681. if not all([node_id, entity_zh, entity_en]):
  682. return jsonify(failed("参数不完整"))
  683. # 创建图谱
  684. result = handle_txt_graph(node_id, entity_zh, entity_en)
  685. if result:
  686. return jsonify(success({"message": "图谱创建成功"}))
  687. else:
  688. return jsonify(failed("图谱创建失败"))
  689. except Exception as e:
  690. logger.error(f"创建文本图谱失败: {str(e)}")
  691. return jsonify(failed(str(e)))
  692. @bp.route('/config', methods=['GET'])
  693. @require_auth
  694. def get_meta_config():
  695. """获取元数据配置信息"""
  696. config = get_minio_config()
  697. return jsonify({
  698. 'bucket_name': config['MINIO_BUCKET'],
  699. 'prefix': config['PREFIX'],
  700. 'allowed_extensions': list(config['ALLOWED_EXTENSIONS'])
  701. })
  702. # 更新元数据
  703. @bp.route('/node/update', methods=['POST'])
  704. def meta_node_update():
  705. try:
  706. if not request.json:
  707. return jsonify(failed("请求数据不能为空"))
  708. # 从请求中获取节点ID和更新数据
  709. node_id = request.json.get('id')
  710. if not node_id:
  711. return jsonify(failed("节点ID不能为空"))
  712. # 验证并转换节点ID为整数
  713. try:
  714. node_id = int(node_id)
  715. except (ValueError, TypeError):
  716. return jsonify(failed(f"节点ID必须为整数,当前值: {node_id}"))
  717. # 更新节点
  718. with neo4j_driver.get_session() as session:
  719. # 检查节点是否存在并获取当前值
  720. check_cypher = """
  721. MATCH (n:DataMeta)
  722. WHERE id(n) = $node_id
  723. RETURN n
  724. """
  725. result = session.run(check_cypher, node_id=node_id)
  726. node = result.single()
  727. if not node or not node["n"]:
  728. return jsonify(failed("节点不存在"))
  729. # 构建更新语句,只更新提供的属性
  730. update_cypher = """
  731. MATCH (n:DataMeta)
  732. WHERE id(n) = $node_id
  733. SET n.updateTime = $update_time
  734. """
  735. # 准备更新参数
  736. update_params = {
  737. 'node_id': node_id,
  738. 'update_time': get_formatted_time()
  739. }
  740. # 处理每个可能的更新字段
  741. fields_to_update = {
  742. 'name_zh': request.json.get('name_zh'),
  743. 'category': request.json.get('category'),
  744. 'alias': request.json.get('alias'),
  745. 'affiliation': request.json.get('affiliation'),
  746. 'data_type': request.json.get('data_type'),
  747. 'describe': request.json.get('describe'),
  748. 'status': request.json.get('status'),
  749. 'name_en': request.json.get('name_en')
  750. }
  751. # 只更新提供了新值的字段
  752. for field, new_value in fields_to_update.items():
  753. if new_value is not None:
  754. # 特殊处理 data_type 字段映射
  755. if field == 'data_type':
  756. update_cypher += f", n.data_type = ${field}\n"
  757. else:
  758. update_cypher += f", n.{field} = ${field}\n"
  759. update_params[field] = new_value
  760. update_cypher += "RETURN n"
  761. result = session.run(
  762. update_cypher, # type: ignore[arg-type]
  763. **update_params
  764. )
  765. updated_node = result.single()
  766. if updated_node and updated_node["n"]:
  767. node_data = dict(updated_node["n"])
  768. node_data["id"] = updated_node["n"].id
  769. # 如果更新了标签,处理标签关系
  770. tag = request.json.get('tag')
  771. if tag is not None:
  772. # 先删除现有标签关系
  773. delete_tag_cypher = """
  774. MATCH (n:DataMeta)-[r:LABEL]->(t:DataLabel)
  775. WHERE id(n) = $node_id
  776. DELETE r
  777. """
  778. session.run(delete_tag_cypher, node_id=node_id)
  779. # 创建新的标签关系
  780. is_valid_tag = (
  781. tag and isinstance(tag, dict)
  782. and 'id' in tag and tag['id']
  783. )
  784. if is_valid_tag:
  785. try:
  786. tag_id = int(tag['id'])
  787. create_tag_cypher = """
  788. MATCH (n:DataMeta), (t:DataLabel)
  789. WHERE id(n) = $node_id AND id(t) = $tag_id
  790. MERGE (n)-[r:LABEL]->(t)
  791. RETURN r
  792. """
  793. session.run(
  794. create_tag_cypher,
  795. node_id=node_id,
  796. tag_id=tag_id
  797. )
  798. except (ValueError, TypeError):
  799. logger.warning(f"标签ID无效: {tag.get('id')}")
  800. logger.info(f"成功更新元数据节点: ID={node_data['id']}")
  801. return jsonify(success(node_data))
  802. else:
  803. logger.error(f"更新元数据节点失败: ID={node_id}")
  804. return jsonify(failed("更新元数据节点失败"))
  805. except Exception as e:
  806. logger.error(f"更新元数据失败: {str(e)}")
  807. return jsonify(failed(str(e)))