|
114 | 114 | "# before starting jupyter notebook to provide the password for the user \"neo4j\". \n", |
115 | 115 | "# It is not recommended to hardcode the password into jupyter notebook for security reasons.\n", |
116 | 116 | "\n", |
117 | | - "driver = GraphDatabase.driver(uri=\"bolt://localhost:7687\", auth=(\"neo4j\", os.environ.get(\"NEO4J_INITIAL_PASSWORD\")))\n", |
| 117 | + "driver = GraphDatabase.driver(uri=\"bolt://localhost:7687\", auth=(\"neo4j\", os.environ.get(\"NEO4J_INITIAL_PASSWORD\"))) # pyright: ignore[reportArgumentType]\n", |
118 | 118 | "driver.verify_connectivity()" |
119 | 119 | ] |
120 | 120 | }, |
|
131 | 131 | " \n", |
132 | 132 | "\n", |
133 | 133 | "def query_cypher_to_data_frame(filename, parameters_: typ.Optional[typ.Dict[str, typ.Any]] = None):\n", |
134 | | - " records, summary, keys = driver.execute_query(get_cypher_query_from_file(filename),parameters_=parameters_)\n", |
| 134 | + " records, summary, keys = driver.execute_query(get_cypher_query_from_file(filename),parameters_=parameters_) # type: ignore\n", |
135 | 135 | " return pd.DataFrame([r.values() for r in records], columns=keys)\n", |
136 | 136 | "\n", |
137 | 137 | "\n", |
|
173 | 173 | " The number of the dimensions and therefore size of the resulting array of floating point numbers\n", |
174 | 174 | " \"\"\"\n", |
175 | 175 | " \n", |
176 | | - " is_data_missing=query_cypher_to_data_frame(\"../cypher/Dependencies_Projection/Dependencies_0_Check_Projectable.cypher\", parameters).empty\n", |
| 176 | + " is_data_missing=query_cypher_to_data_frame(\"../../../cypher/Dependencies_Projection/Dependencies_0_Check_Projectable.cypher\", parameters).empty\n", |
177 | 177 | " if is_data_missing: return False\n", |
178 | 178 | "\n", |
179 | | - " query_cypher_to_data_frame(\"../cypher/Dependencies_Projection/Dependencies_1_Delete_Projection.cypher\", parameters)\n", |
180 | | - " query_cypher_to_data_frame(\"../cypher/Dependencies_Projection/Dependencies_2_Delete_Subgraph.cypher\", parameters)\n", |
| 179 | + " query_cypher_to_data_frame(\"../../../cypher/Dependencies_Projection/Dependencies_1_Delete_Projection.cypher\", parameters)\n", |
| 180 | + " query_cypher_to_data_frame(\"../../../cypher/Dependencies_Projection/Dependencies_2_Delete_Subgraph.cypher\", parameters)\n", |
181 | 181 | " # To include the direction of the relationships use the following line to create the projection:\n", |
182 | | - " # query_cypher_to_data_frame(\"../cypher/Dependencies_Projection/Dependencies_3_Create_Projection.cypher\", parameters)\n", |
183 | | - " query_cypher_to_data_frame(\"../cypher/Dependencies_Projection/Dependencies_4_Create_Undirected_Projection.cypher\", parameters)\n", |
184 | | - " query_cypher_to_data_frame(\"../cypher/Dependencies_Projection/Dependencies_5_Create_Subgraph.cypher\", parameters)\n", |
| 182 | + " # query_cypher_to_data_frame(\"../../../cypher/Dependencies_Projection/Dependencies_3_Create_Projection.cypher\", parameters)\n", |
| 183 | + " query_cypher_to_data_frame(\"../../../cypher/Dependencies_Projection/Dependencies_4_Create_Undirected_Projection.cypher\", parameters)\n", |
| 184 | + " query_cypher_to_data_frame(\"../../../cypher/Dependencies_Projection/Dependencies_5_Create_Subgraph.cypher\", parameters)\n", |
185 | 185 | " return True" |
186 | 186 | ] |
187 | 187 | }, |
|
204 | 204 | " parameters = dict(\n", |
205 | 205 | " dependencies_projection=projection_name,\n", |
206 | 206 | " )\n", |
207 | | - " return query_cypher_to_data_frame(\"../cypher/Dependencies_Projection/Dependencies_12_Get_Projection_Statistics.cypher\", parameters)\n", |
| 207 | + " return query_cypher_to_data_frame(\"../../../cypher/Dependencies_Projection/Dependencies_12_Get_Projection_Statistics.cypher\", parameters)\n", |
208 | 208 | "\n", |
209 | 209 | "\n", |
210 | 210 | "def get_projected_graph_node_count(projection_name: str) -> int:\n", |
|
275 | 275 | " print(\"No projected data for node embeddings calculation available\")\n", |
276 | 276 | " return empty_embeddings()\n", |
277 | 277 | "\n", |
278 | | - " existing_embeddings_query_filename=\"../cypher/Node_Embeddings/Node_Embeddings_0a_Query_Calculated.cypher\"\n", |
| 278 | + " existing_embeddings_query_filename=\"../queries/node-embeddings/Node_Embeddings_0a_Query_Calculated.cypher\"\n", |
279 | 279 | " embeddings = query_first_non_empty_cypher_to_data_frame(existing_embeddings_query_filename, cypher_file_name, parameters=parameters)\n", |
280 | 280 | " display(embeddings.head()) # Display the first entries of the table\n", |
281 | 281 | " return embeddings" |
|
315 | 315 | " print(\"GraphSAGE node embeddings training will be skipped for \" + str(node_count) + \" (>500) nodes, since it is computationally expensive and not eagerly needed for demonstration purposes.\")\n", |
316 | 316 | " return empty_embeddings()\n", |
317 | 317 | "\n", |
318 | | - " query_cypher_to_data_frame(\"../cypher/Node_Embeddings/Node_Embeddings_0b_Prepare_Degree.cypher\", parameters)\n", |
319 | | - " query_cypher_to_data_frame(\"../cypher/Node_Embeddings/Node_Embeddings_0c_Drop_Model.cypher\", parameters)\n", |
320 | | - " display(query_cypher_to_data_frame(\"../cypher/Node_Embeddings/Node_Embeddings_4b_GraphSAGE_Train.cypher\", parameters))\n", |
321 | | - " embeddings=query_cypher_to_data_frame(\"../cypher/Node_Embeddings/Node_Embeddings_4d_GraphSAGE_Stream.cypher\", parameters)\n", |
| 318 | + " query_cypher_to_data_frame(\"../queries/node-embeddings/Node_Embeddings_0b_Prepare_Degree.cypher\", parameters)\n", |
| 319 | + " query_cypher_to_data_frame(\"../queries/node-embeddings/Node_Embeddings_0c_Drop_Model.cypher\", parameters)\n", |
| 320 | + " display(query_cypher_to_data_frame(\"../queries/node-embeddings/Node_Embeddings_4b_GraphSAGE_Train.cypher\", parameters))\n", |
| 321 | + " embeddings=query_cypher_to_data_frame(\"../queries/node-embeddings/Node_Embeddings_4d_GraphSAGE_Stream.cypher\", parameters)\n", |
322 | 322 | " \n", |
323 | 323 | " display(embeddings.head()) # Display the first entries of the table\n", |
324 | 324 | " return embeddings" |
|
707 | 707 | " \"dependencies_projection_write_property\": \"embeddingsFastRandomProjection\",\n", |
708 | 708 | " \"dependencies_projection_embedding_dimension\":\"32\"\n", |
709 | 709 | "}\n", |
710 | | - "embeddings_fastRP = create_node_embeddings(\"../cypher/Node_Embeddings/Node_Embeddings_1d_Fast_Random_Projection_Stream.cypher\", java_package_embeddings_parameters)\n" |
| 710 | + "embeddings_fastRP = create_node_embeddings(\"../queries/node-embeddings/Node_Embeddings_1d_Fast_Random_Projection_Stream.cypher\", java_package_embeddings_parameters)\n" |
711 | 711 | ] |
712 | 712 | }, |
713 | 713 | { |
|
777 | 777 | " \"dependencies_projection_write_property\": \"embeddingsHashGNN\",\n", |
778 | 778 | " \"dependencies_projection_embedding_dimension\":\"64\"\n", |
779 | 779 | "}\n", |
780 | | - "embeddings_hashGNN = create_node_embeddings(\"../cypher/Node_Embeddings/Node_Embeddings_2d_Hash_GNN_Stream.cypher\", java_package_embeddings_parameters)\n", |
| 780 | + "embeddings_hashGNN = create_node_embeddings(\"../queries/node-embeddings/Node_Embeddings_2d_Hash_GNN_Stream.cypher\", java_package_embeddings_parameters)\n", |
781 | 781 | "embeddings_hashGNN = prepare_node_embeddings_for_2d_visualization(embeddings_hashGNN)\n", |
782 | 782 | "scores_hashGNN = CommunityScores.calculate(embeddings_hashGNN)\n", |
783 | 783 | "plot_2d_node_embeddings(embeddings_hashGNN, get_plot_title(\"Java Packages\", \"HashGNN\", scores_hashGNN))" |
|
803 | 803 | " \"dependencies_projection_write_property\": \"embeddingsNode2Vec\",\n", |
804 | 804 | " \"dependencies_projection_embedding_dimension\":\"32\"\n", |
805 | 805 | "}\n", |
806 | | - "embeddings_node2vec = create_node_embeddings(\"../cypher/Node_Embeddings/Node_Embeddings_3d_Node2Vec_Stream.cypher\", java_package_embeddings_parameters)\n", |
| 806 | + "embeddings_node2vec = create_node_embeddings(\"../queries/node-embeddings/Node_Embeddings_3d_Node2Vec_Stream.cypher\", java_package_embeddings_parameters)\n", |
807 | 807 | "embeddings_node2vec = prepare_node_embeddings_for_2d_visualization(embeddings_node2vec)\n", |
808 | 808 | "scores_node2vec = CommunityScores.calculate(embeddings_node2vec)\n", |
809 | 809 | "plot_2d_node_embeddings(embeddings_node2vec, get_plot_title(\"Java Packages\", \"node2vec\", scores_node2vec))" |
|
0 commit comments