golang知識圖譜NLP實戰第四節——關係抽取完善邏輯

阿新 • • 發佈：2019-02-06

用golang應用提交文字給這個hanlp服務，返回json資料格式的依存句法分析結果。

//這個是專門解析json的
package main

import (
	"encoding/json"
	"fmt"
	"log"
	"net/url"

	"github.com/astaxie/beego/httplib"
)

// Dict groups the direct dependents of a single word by dependency relation.
// main builds one Dict per word of the sentence and stores each dependent in
// the field that corresponds to the dependent's DEPREL label; extract then
// reads these fields to recognise relation patterns.
type Dict struct {
	SBV []HanlpJson // dependents labelled "主謂關係" (subject-verb)
	VOB []HanlpJson // dependents labelled "動賓關係" (verb-object)
	IOB []HanlpJson // dependents labelled "間賓關係" (indirect object)
	FOB []HanlpJson // dependents labelled "前置賓語" (fronted object)
	DBL []HanlpJson // dependents labelled "兼語" (pivot / double role)
	ATT []HanlpJson // dependents labelled "定中關係" (attribute)
	ADV []HanlpJson // dependents labelled "狀中結構" (adverbial)
	CMP []HanlpJson // dependents labelled "動補結構" (verb complement)
	COO []HanlpJson // dependents labelled "並列關係" (coordination)
	POB []HanlpJson // dependents labelled "介賓關係" (preposition-object)
	LAD []HanlpJson // dependents labelled "左附加關係" (left adjunct)
	RAD []HanlpJson // dependents labelled "右附加關係" (right adjunct)
	IS  []HanlpJson // dependents labelled "獨立結構" (independent structure)
	HED []HanlpJson // dependents labelled "核心關係" (head of the sentence)
}

// HanlpResult is the top-level object that main decodes the service response
// into; the parsed sentence is found under the "result" key.
type HanlpResult struct {
	Result HanlpWord `json:"result"`
}

// HanlpWord holds the list of words decoded from the "word" key of the
// response's "result" object.
type HanlpWord struct {
	Word []HanlpJson `json:"word"`
}

// HanlpJson is the JSON decoding target for one word of the parsed sentence.
// No struct tags are declared, so encoding/json matches the response keys to
// the field names (case-insensitively).
// NOTE(review): the field set looks like CoNLL-style dependency output —
// confirm against the service's actual response.
type HanlpJson struct {
	ID      int64  // word ID; extract uses ID-1 as an index into the word list
	LEMMA   string // word text; used as entity/relation text by extract
	CPOSTAG string // presumably the coarse part-of-speech tag — confirm
	POSTAG  string // presumably the fine part-of-speech tag — confirm
	HEAD    Json   // the word this one depends on; main matches on HEAD.ID
	DEPREL  string // dependency relation label towards HEAD (Chinese label text)
	NAME    string // not read anywhere in this file
}

// Json is the type of HanlpJson.HEAD: it has the same fields as HanlpJson
// except that it carries no HEAD of its own, so the decoded structure does not
// nest further. Only its ID is read by the code in this file.
type Json struct {
	ID      int64
	LEMMA   string
	CPOSTAG string
	POSTAG  string
	DEPREL  string
	NAME    string
}

// Ltp2 wraps a list of Ltp1 values.
// NOTE(review): not referenced by main or extract in this file; presumably
// left over from an earlier LTP-based decoding attempt — confirm before
// removing.
type Ltp2 struct {
	Ltptwo []Ltp1
}

// Ltp1 wraps a list of Ltp values. It is not referenced by main or extract in
// this file.
type Ltp1 struct { // this approach does not work; kept for reference
	Ltpone []Ltp
}

// Ltp is a JSON decoding target for one word record with lower-case keys.
// NOTE(review): presumably mirrors the output of an LTP service (id, content,
// POS, named entity, syntactic and semantic parent/relation) — confirm; it is
// not referenced by main or extract in this file.
type Ltp struct {
	Id        int64  `json:"id"`
	Cont      string `json:"cont"`
	Pos       string `json:"pos"`
	Ne        string `json:"ne"`
	Parent    int64  `json:"parent"`
	Relate    string `json:"relate"`
	Semparent int64  `json:"semparent"`
	Semrelate string `json:"semrelate"`
	Arg       []Arg1 `json:"arg"`
	Sem       []Sem1 `json:"sem"`
}

// Sem1 is the element type of Ltp.Sem, decoded from the "sem" array: an id
// with a parent id and a relation label.
// NOTE(review): presumably one semantic-dependency edge — confirm.
type Sem1 struct {
	Id     int64  `json:"id"`
	Parent int64  `json:"parent"`
	Relate string `json:"relate"`
}

// Arg1 is the element type of Ltp.Arg, decoded from the "arg" array: an id, a
// type label and a beg/end pair.
// NOTE(review): presumably a semantic-role argument whose beg/end are word
// positions — confirm.
type Arg1 struct {
	Id   int64  `json:"id"`
	Type string `json:"type"`
	Beg  int64  `json:"beg"`
	End  int64  `json:"end"`
}

func main() {
	link := url.QueryEscape("輸水乾線從佛山市順德區杏壇鎮西江干流中央的鯉魚洲島端部取水")
	req := httplib.Post("http://localhost:8888/max?sentence=" + link)
	str, err := req.String()
	if err != nil {
		log.Fatal(err)
	}
	//	fmt.Println(str)
	//json字串解析到結構體
	var hanlpresult HanlpResult
	err = json.Unmarshal([]byte(str), &hanlpresult)
	if err != nil {
		log.Fatal(err)
	}
	//	fmt.Println(hanlpresult.Result.Word)
	hanlp := hanlpresult.Result.Word
	dict := make([]Dict, 0)
	for _, w := range hanlp {
		dict1 := make([]Dict, 1)
		for _, x := range hanlp {
			if w.ID == x.HEAD.ID {
				list1 := make([]HanlpJson, 1)
				list1[0] = x
				switch x.DEPREL {
				case "主謂關係":
					dict1[0].SBV = list1
				case "動賓關係":
					dict1[0].VOB = list1
				case "間賓關係":
					dict1[0].IOB = list1
				case "前置賓語":
					dict1[0].FOB = list1
				case "兼語":
					dict1[0].DBL = list1
				case "定中關係":
					dict1[0].ATT = list1
				case "狀中結構":
					dict1[0].ADV = list1
				case "動補結構":
					dict1[0].CMP = list1
				case "並列關係":
					dict1[0].COO = list1
				case "介賓關係":
					dict1[0].POB = list1
				case "左附加關係":
					dict1[0].LAD = list1
				case "右附加關係":
					dict1[0].RAD = list1
				case "獨立結構":
					dict1[0].IS = list1
				case "核心關係":
					dict1[0].HED = list1
				}
				//				bb = make([]Hanlp, 0)
			}
		}
		dict = append(dict, dict1...)
	}
	//	fmt.Println(dict)
	for i := 0; i < len(dict); i++ {
		extract(hanlp, dict, i)
	}
}

// extract prints every relation triple that the dependency patterns below
// recognise around word i, one per line in the form "entity1,relation,entity2".
//
// hanlp is the parsed sentence, dict holds each word's dependents grouped by
// relation (dict[k] belongs to hanlp[k]) and i selects the word to inspect.
// Word IDs are treated as 1-based positions: the entry for the word with ID n
// is looked up at index n-1. An out-of-range i, or an ID that does not address
// an element, is skipped instead of causing an index-out-of-range panic.
func extract(hanlp []HanlpJson, dict []Dict, i int) {
	if i < 0 || i >= len(hanlp) || i >= len(dict) {
		return
	}
	w := hanlp[i]
	ww := dict[i]

	emit := func(entity1, relation, entity2 string) {
		fmt.Println(entity1 + "," + relation + "," + entity2)
	}
	hasSBV := len(ww.SBV) > 0
	hasVOB := len(ww.VOB) > 0
	hasADV := len(ww.ADV) > 0
	hasCMP := len(ww.CMP) > 0

	// Subject-verb-object, e.g. "劉小緒生於四川".
	if hasSBV && hasVOB {
		subject := ww.SBV[0]
		// Special case "劉小緒和李華是朋友": when the subject has a coordinated
		// word, the object becomes the relation and the coordinated word the
		// second entity.
		if coo := dictByID(dict, subject.ID).COO; len(coo) > 0 {
			emit(subject.LEMMA, ww.VOB[0].LEMMA, coo[0].LEMMA)
		} else {
			emit(subject.LEMMA, w.LEMMA, ww.VOB[0].LEMMA)
		}
	}

	// Verb-complement, e.g. "劉小緒洗乾淨了衣服": the relation is the verb plus
	// its complement, plus the right adjunct when there is one.
	if hasSBV && hasVOB && hasCMP {
		relation := w.LEMMA + ww.CMP[0].LEMMA
		if len(ww.RAD) > 0 {
			relation += ww.RAD[0].LEMMA
		}
		emit(ww.SBV[0].LEMMA, relation, ww.VOB[0].LEMMA)
	}

	// Attribute: w is modified by an attribute and, somewhere in the sentence,
	// a word whose text equals w is the subject of a verb that has an object.
	// The whole dict slice is scanned for that.
	if len(ww.ATT) > 0 {
		entity1 := ww.ATT[0].LEMMA
		relation := w.LEMMA
		for _, d := range dict {
			if len(d.SBV) > 0 && len(d.VOB) > 0 && d.SBV[0].LEMMA == relation {
				emit(entity1, relation, d.VOB[0].LEMMA)
			}
		}
	}

	// Adverbial-verb, e.g. "父親非常喜歡跑步": the adverbial "非常" is prefixed
	// to the verb, giving the relation "非常喜歡".
	if hasSBV && hasVOB && hasADV {
		emit(ww.SBV[0].LEMMA, ww.ADV[0].LEMMA+w.LEMMA, ww.VOB[0].LEMMA)
	}

	// Adverbial-verb-complement: adverbial + verb + complement.
	if hasSBV && hasVOB && hasADV && hasCMP {
		relation := ww.ADV[0].LEMMA + w.LEMMA + ww.CMP[0].LEMMA
		emit(ww.SBV[0].LEMMA, relation, ww.VOB[0].LEMMA)
	}

	// Postposed attribute, e.g. "父親是來自肯亞的留學生": w is itself an
	// attribute of its head and has an object.
	if w.DEPREL == "定中關係" && hasVOB {
		if head := w.HEAD.ID; head >= 1 && head <= int64(len(hanlp)) {
			emit(hanlp[head-1].LEMMA, w.LEMMA, ww.VOB[0].LEMMA)
		}
	}

	// Preposition-object, e.g. "劉小緒就職於學校": "於" is the complement of the
	// verb and "學校" is the object of "於".
	if hasSBV && hasCMP {
		prep := ww.CMP[0]
		if pob := dictByID(dict, prep.ID).POB; len(pob) > 0 {
			emit(ww.SBV[0].LEMMA, w.LEMMA+prep.LEMMA, pob[0].LEMMA)
		}
	}

	// Fronted object, e.g. "海洋由水組成": the fronted object is the second
	// entity and the object of the adverbial preposition is the first.
	if len(ww.FOB) > 0 && hasADV {
		if pob := dictByID(dict, ww.ADV[0].ID).POB; len(pob) > 0 {
			emit(pob[0].LEMMA, w.LEMMA, ww.FOB[0].LEMMA)
		}
	}
}

// dictByID returns the dependents of the word whose 1-based ID is id, or an
// empty Dict when id does not address an element of dict.
func dictByID(dict []Dict, id int64) Dict {
	if id < 1 || id > int64(len(dict)) {
		return Dict{}
	}
	return dict[id-1]
}

golang知識圖譜NLP實戰第四節——關係抽取完善邏輯

用golang應用提交文字給這個hanlp服務，返回json資料格式的依存句法分析結果。 //這個是專門解析json的 package main import ( "encoding/json" "fmt" "log" "net/url" "github.

golang知識圖譜NLP實戰第二節——解析依存句法分析結果

1 參考資料 2 思路過程可以用hanlp做句子的依存句法分析，得到欄位如下：問題，怎樣得到json資料？怎樣讓hanlp提供服務？ 1 房頂房頂 n n _ 2 定中關係 _ _ 2 上上 nd f _ 3 狀中結構 _

golang知識圖譜NLP實戰第一節——整體思路

最大的願望是給engineercms工程師知識管理系統新增人工智慧——知識圖譜功能它包含了自然語言處理（NLP）的十大任務裡的幾項（Salesforce總結的十大任務，簡單來說包括：問答、機器翻譯、摘要、自然語言推理、情感分析、語義角色標註、關係抽取、目標導向

Scala入門到精通——第四節 Set、Map、Tuple、佇列操作實戰

本節主要內容 mutable、immutable集合 Set操作實戰 Map操作實戰 Tuple操作實戰佇列操作實戰棧操作實戰 mutable、immutable集合 Scala collections systematically d

李嘉璇 TensorFlow技術解析與實戰第四章筆記 TensorFlow基礎知識

系統架構最下層是網路通訊層和裝置管理層。網路通訊層包括 gRPC（google Remote Procedure Call Protocol）和遠端直接資料存取（Remote DirectMemory Access， RDMA），這都是在分散式計算時需要用到的。裝置管理層包

【手把手】JavaWeb 入門級專案實戰 -- 文章釋出系統（第四節）

首先，更正一下上一章中的一個小錯誤，就是在index.jsp中，banner部分沒有新增結束的標籤,加上去就OK了，我也是完善頁面的時候發現的。另外，index.jsp中引入的jQuery也需要換成本地的。 <script src="${basePath}/st

JavaWeb 入門級專案實戰 -- 文章釋出系統（第四節）

首先，更正一下上一章中的一個小錯誤，就是在index.jsp中，banner部分沒有新增結束的標籤,加上去就OK了，我也是完善頁面的時候發現的。另外，index.jsp中引入的jQuery也需要換成本地的。 <script src="${basePath}/stat

python預習－第四節

4.4 第四節 list elif eight float idt see height ＃遍歷列表所有元素 #!/usr/bin/python# -*- coding: UTF-8 -*- listm=["s","l","z","x","l","m","XX",[12

spring實戰第四版第五章pom.xml

第四版 context -c sco cas val mysql packaging core <project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/X

火雲開發課堂 - 《使用Cocos2d-x 開發3D遊戲》系列第四節:3D公告板

bold tar tracking forum dsm span 公告板 eight 第四節《使用Cocos2d-x 開發3D遊戲》系列在線課程第四節:3D公告板視頻地址：http://edu.csdn.net/course/attend/1

JAVAscript學習筆記 js句柄監聽事件第四節（原創）參考js使用表

必須 htm -c eve property blog uncaught event add <!DOCTYPE html> <html lang="en"> <head> <meta charset="UTF-8">

第四節課：幾種常見的攻擊方式

pxc wql ptc hvm oid hsv ffd stl -1 1.中間人攻擊局域網ARP攻擊受害者經過攻擊者向網關發送數據。當主機A、和主機B通信時，都由主機C來為其“轉發”，如圖一，而A、B之間並沒有真正意思上的直接通信，他們之間的信息傳遞同C作為中介來完成

第四節遠程登錄LINUX

div spa tab rar 臨時遠程連接 kth ssh-key shel 1.linux 遠程連接工具：puTTy xshell 下載地址： putty : https://www.chiark.greenend.org.uk/~sgtatham/putt

Spring 實戰-第四章-4.3 Introductions&@DeclareParents

frame 轉換 ret ger ted integer cati override pub @DeclareParents非常有意思，單獨拿出來，這個可以給實現相同接口的類增加新的共同接口，這樣在不侵入原有代碼的情況下，轉換成其他類型並擁有新的方法。這個功能在Sp

Spring 實戰-第四章-4.4 使用xml中聲明切面及引入新方法

cati sys epp proc oca cover tor ring tex 當不能直接接觸源碼時，同樣的不能給源碼增加註解，這時可以使用xml的方式聲明切面並引入新方法 CompactDisc接口 package main.java.soundsystem;

【第四節 Node.js模塊和包】

可選 obj hello keyword tor 簡單 enc mod ima 概念：模塊(Module)和包(Package)是Node.js最重要的支柱。開發一個具有一定規模的程序不可能只用一個文件，通常需要把各個功能拆分、分裝、然後組合起來。模塊正式為

OpenGL第四節：滾動和矩陣棧

模型 ide bsp else glut render load errors 文件頭文件不變 LUtil.h GLfloat gCameraX = 0.f, gCameraY = 0.f;//相機位置 bool initGL(){ 　　glViewport(

第四節數據的刪除

沒有 collect mov 進行 remove 參數 http con move remove({key:value}); 刪除必須傳遞參數 db.config_collection.remove({x:14}) 1.首先查詢 2 2.確定有數據進行刪除 db.co

第四節：dingo/API 最新版 V2.0 之 Responses （連載）

internal arr highlight previous cati list n) 改變定制因為某些某些原因，不能按時更新，唉。我會盡力，加快速度。（這句話不是翻譯的哈）原文地址——> https://github.com/dingo/api/wiki/R

python學習第四節叠代器生成器面向過程編程

break 對象 end 面向過程編程捕捉捕捉異常就會 python學習因此 1：什麽是叠代可以直接作用於for循環的對象統稱為可叠代對象(Iterable)。可以被next()函數調用並不斷返回下一個值的對象稱為叠代器(Iterator

golang知識圖譜NLP實戰第四節——關係抽取完善邏輯

相關推薦