Skip to content

Commit 8d4f815

Browse files
committed
1.修改并整理关系导出文件夹,将公司核心图的连接信息导出;
2.修改部分文件的函数调用依赖。
1 parent ee66c03 commit 8d4f815

File tree

11 files changed

+102954
-492617
lines changed

11 files changed

+102954
-492617
lines changed

Data/Encoding/all_edge.edgelist

Lines changed: 0 additions & 117072 deletions
This file was deleted.

Data/Encoding/all_edge_with_edgetype.edgelist

Lines changed: 0 additions & 117072 deletions
This file was deleted.

Data/Encoding/all_node_encoding.csv

Lines changed: 0 additions & 73865 deletions
This file was deleted.

Data/Encoding/com_edge.edgelist

Lines changed: 0 additions & 62595 deletions
This file was deleted.

Data/Encoding/com_edge_with_edgetype.edgelist

Lines changed: 0 additions & 62595 deletions
This file was deleted.

Data/Encoding/com_node.csv

Lines changed: 0 additions & 59401 deletions
This file was deleted.
File renamed without changes.

Data/Export/com_name_edge_type.csv

Lines changed: 102938 additions & 0 deletions
Large diffs are not rendered by default.

Data_process/data_process.py

Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -76,7 +76,7 @@ def com_data_pre3(): # 整合并排序多个文件中的公司数据
7676

7777

7878
def node_encoding(): # 编码所有节点
79-
with open('../Data/Encoding/com_node.csv', 'w', encoding='utf-8', newline='') as csvfile:
79+
with open('../Data/Export/com_node.csv', 'w', encoding='utf-8', newline='') as csvfile:
8080
writer = csv.writer(csvfile, delimiter='\t')
8181
writer.writerow(['节点类型', '原标识', '编码'])
8282
# nodes = graph.find(label='USER')
@@ -126,14 +126,14 @@ def node_encoding(): # 编码所有节点
126126
def edge_formatting(): # 抽取所有边,并依照节点编码格式化
127127
d = dict()
128128
k = 0
129-
with open('../Data/Encoding/com_node.csv', 'r', encoding='utf-8', newline='') as csvfile:
129+
with open('../Data/Export/com_node.csv', 'r', encoding='utf-8', newline='') as csvfile:
130130
rows = csv.reader(csvfile, delimiter='\t')
131131
for index, row in enumerate(rows):
132132
if index == 0:
133133
continue
134134
d[row[1]] = row[2]
135135

136-
with open('../Data/Encoding/com_edge_with_edgetype.edgelist', 'w', encoding='utf-8', newline='') as edgelist:
136+
with open('../Data/Export/com_edge_with_edgetype.edgelist', 'w', encoding='utf-8', newline='') as edgelist:
137137
edgewriter = csv.writer(edgelist, delimiter='\t')
138138
with open('../Data/com_industry_tags.csv', 'r', encoding='utf-8', newline='') as csvfile:
139139
rows = csv.reader(csvfile)
@@ -284,8 +284,8 @@ def edge_formatting(): # 抽取所有边,并依照节点编码格式化
284284

285285

286286
def edgelist_process(): # 边列表处理
287-
with open('../Data/Encoding/com_edge_with_edgetype.edgelist', 'r', encoding='utf-8', newline='') as edgelist1, \
288-
open('../Data/Encoding/com_edge.edgelist', 'w', encoding='utf-8', newline='') as edgelist2:
287+
with open('../Data/Export/com_edge_with_edgetype.edgelist', 'r', encoding='utf-8', newline='') as edgelist1, \
288+
open('../Data/Export/com_edge.edgelist', 'w', encoding='utf-8', newline='') as edgelist2:
289289
edgewreader = csv.reader(edgelist1, delimiter='\t')
290290
edgewriter = csv.writer(edgelist2, delimiter='\t')
291291
for row in edgewreader:

Graph/graph_init_create.py

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1,12 +1,12 @@
1-
from Graph.process import Con_Neo4j
2-
from py2neo import Relationship, Node
1+
from py2neo import Graph, Node, Relationship
32
import csv
43
from Data_process.data_extraction import file_name
54
import re
65
import time
76

87

9-
graph = Con_Neo4j(http='http://127.0.0.1:7474', username='neo4j', password='123456')
8+
# 连接图数据库
9+
graph = Graph('http://127.0.0.1:7474', username='neo4j', password='123456', bolt=True, secure=False)
1010

1111

1212
def com_type(code): # 识别公司代码所属类别,包括:深A、沪A、深B、沪B、三板、其它、非上市

0 commit comments

Comments
 (0)