创建节点和建立关系
# -*- coding:utf-8 -*-
from py2neo import Node,Relationship,Graph,NodeMatcher,RelationshipMatcher
# 数据库
graph = Graph('http://localhost:7474', auth=("neo4j", "123456"))
# 查询节点是否存在
def MatchNode(m_graph,m_label,m_attrs):
m_n = "_.name=" + "\'" + m_attrs['name'] + "\'"
matcher = NodeMatcher(m_graph)
re_value = matcher.match(m_label).where(m_n).first()
return re_value
# 创建节点
def CreateNode(m_graph,m_label,m_attrs):
re_value = MatchNode(m_graph,m_label,m_attrs)
# print(re_value)
if re_value is None:
m_node = Node(m_label,**m_attrs)
# 创建节点
n = graph.create(m_node)
return n
return None
label1 = 'Stock'
attrs1 = {"name":'招商银行',"code":'600036'}
label2 = 'SecuritiesExchange'
attrs2 = {"name":'上海证券交易所'}
CreateNode(graph,label1,attrs1)
CreateNode(graph,label2,attrs2)
# 建立两个节点的关系,如果节点不存在,不进行创建
def CreateRelationship(m_graph,m_label1,m_attrs1,m_label2,m_attrs2,m_r_name):
re_value1 = MatchNode(m_graph,m_label1,m_attrs1)
re_value2 = MatchNode(m_graph,m_label2,m_attrs2)
if re_value1 is None or re_value2 is None:
return False
m_r = Relationship(re_value1,m_r_name,re_value2)
n = graph.create(m_r)
return n
m_r_name = "证券交易所"
re_value = CreateRelationship(graph,label1,attrs1,label2,attrs2,m_r_name)
查询操作
# -*- coding:utf-8 -*-
from py2neo import Node,Relationship,Graph,NodeMatcher,RelationshipMatcher
# 数据库
graph = Graph('http://localhost:7474', auth=("neo4j", "123456"))
# 按id查询节点
def MatchNodeByID(m_graph,m_id):
matcher = NodeMatcher(m_graph)
re_value = matcher.get(m_id)
return re_value
# 按attr查询节点
def MatchNodeByAttr(m_graph,m_label,m_attrs):
m_n = "_.name=" + "\'" + m_attrs['name'] + "\'"
matcher = NodeMatcher(m_graph)
re_value = matcher.match(m_label).where(m_n).first()
return re_value
# 按label查询节点
def MatchNodeByLabel(m_graph,m_label):
matcher = NodeMatcher(m_graph)
re_value = matcher.match(m_label)
return re_value
print(MatchNodeByID(graph,0))
print(MatchNodeByAttr(graph,'Stock',{"name":'招商银行',"code":'600036'}))
print(MatchNodeByLabel(graph,'Stock'))
通过Cypher命令批量创建节点
- 下载文件
板块,公司全称,英文名称,注册地址,A股代码,A股简称,A股上市日期,A股总股本,A股流通股本,B股代码,B股 简 称,B股上市日期,B股总股本,B股流通股本,地 区,省 份,城 市,所属行业,公司网址
主板,平安银行股份有限公司,"Ping An Bank Co., Ltd.",广东省深圳市罗湖区深南东路5047号,000001,平安银行,1991-04-03,"19,405,918,198","19,405,546,950",,,,0,0,华南,广东,深圳市,J 金融业,bank.pingan.com
主板,万科企业股份有限公司,"CHINA VANKE CO., LTD.",广东省深圳市盐田区大梅沙环梅路33号万科中心,000002,万 科A,1991-01-29,"9,724,196,533","9,717,553,265",,,,0,0,华南,广东,深圳市,K 房地产,www.vanke.com
主板,深圳国华网安科技股份有限公司,"Shenzhen GuoHua Network Security Technology Co., Ltd.",广东省深圳市福田区梅林街道梅都社区中康路126号卓越梅林中心广场(南区)卓悦汇B2206A,000004,国华网安,1990-12-01,"156,003,026","116,330,763",,,,0,0,华南,广东,深圳市,I 信息技术,www.sz000004.cn
......
# -*- coding:utf-8 -*-
import urllib.request
def DownloadSZExchangeExcel():
url = 'http://www.szse.cn/api/report/ShowReport?SHOWTYPE=xlsx&CATALOGID=1110&TABKEY=tab1&random=0.4744196476238187'
downPath = 'A股列表.xlsx'
urllib.request.urlretrieve(url,downPath)
DownloadSZExchangeExcel()
# -*- coding:utf-8 -*-
import xlrd
import uuid
from py2neo import Graph
# 数据库
graph = Graph('http://localhost:7474', auth=("neo4j", "123456"))
# 创建节点
def CreateNode(m_graph,m_cypher):
m_graph.run(m_cypher)
def Excel2Nor4j(m_graph):
label = 'Stock'
# filename = 'A股列表.xls'.encode('utf-8').decode('utf-8')
readbook = xlrd.open_workbook('A股列表.xls',encoding_override="utf-8")
sheet = readbook.sheet_by_name('A股列表')
nrows = sheet.nrows
ncols = sheet.ncols
for i in range(1,nrows):
c_cmd0 = 'create(n:{0}{{code:\'{1}\','.format(label,sheet.cell(i,4).value)
c_cmd1 = 'name:\'{0}\','.format(sheet.cell(i,5).value)#.replace('A','A')
c_cmd2 = 'id:\'{0}\','.format(uuid.uuid3(uuid.NAMESPACE_DNS,sheet.cell(i,4).value).hex)
c_cmd3 = 'fullname:\'{0}\','.format(sheet.cell(i,1).value)
c_cmd4 = 'englishname:\'{0}\','.format(sheet.cell(i,2).value)
c_cmd5 = 'address:\'{0}\','.format(sheet.cell(i,3).value)
c_cmd6 = 'fdate:\'{0}\','.format(sheet.cell(i,6).value)
c_cmd7 = 'province:\'{0}\','.format(sheet.cell(i,15).value)
c_cmd8 = 'city:\'{0}\','.format(sheet.cell(i,16).value)
c_cmd9 = 'industry:\'{0}\','.format(sheet.cell(i,17).value)
c_cmd10 = 'weburl:\'{0}\'}})'.format(sheet.cell(i,18).value)
c_cmd = c_cmd0+c_cmd1+c_cmd2+c_cmd3+c_cmd4+c_cmd5+c_cmd6+c_cmd7+c_cmd8+c_cmd9+c_cmd10
print(c_cmd)
CreateNode(graph,c_cmd)
Excel2Nor4j(graph)
print("End")
# 查询某个标签的节点个数
def GetNodeCountByLabel(m_graph,m_label):
m_n = "match(n:"+m_label+") return count(n)"
return m_graph.run(m_n).data()
print(GetNodeCountByLabel(graph,"Stock"))