tigergraph
diff --git a/‎algorithms/.DS_Store
-6 KB b/‎algorithms/.DS_Store
-6 KB
diff --git a/‎algorithms/Centrality/article_rank/tg_algo_article_rank.yml
+1-1 b/‎algorithms/Centrality/article_rank/tg_algo_article_rank.yml
+1-1
diff --git a/‎algorithms/Centrality/betweenness/tg_algo_betweenness_cent.yml
+1-1 b/‎algorithms/Centrality/betweenness/tg_algo_betweenness_cent.yml
+1-1
diff --git a/‎algorithms/Centrality/closeness/approximate/tg_algo_closeness_cent_approx.yml
+1-1 b/‎algorithms/Centrality/closeness/approximate/tg_algo_closeness_cent_approx.yml
+1-1
diff --git a/‎algorithms/Centrality/closeness/exact/tg_algo_closeness_cent.yml
+2-2 b/‎algorithms/Centrality/closeness/exact/tg_algo_closeness_cent.yml
+2-2
diff --git a/‎algorithms/Centrality/closeness/tg_sub_closeness.yml
+1-1 b/‎algorithms/Centrality/closeness/tg_sub_closeness.yml
+1-1
diff --git a/‎algorithms/Centrality/degree/tg_algo_degree_cent.yml
+2-2 b/‎algorithms/Centrality/degree/tg_algo_degree_cent.yml
+2-2
diff --git a/‎algorithms/Centrality/eigenvector/tg_algo_eigenvector.yml
+2-2 b/‎algorithms/Centrality/eigenvector/tg_algo_eigenvector.yml
+2-2
diff --git a/‎algorithms/Centrality/harmonic/tg_algo_harmonic_cent.yml
+2-2 b/‎algorithms/Centrality/harmonic/tg_algo_harmonic_cent.yml
+2-2
diff --git a/‎algorithms/Centrality/influence_maximization/CELF/tg_algo_influence_maximization_CELF.yml
+1-1 b/‎algorithms/Centrality/influence_maximization/CELF/tg_algo_influence_maximization_CELF.yml
+1-1
diff --git a/‎algorithms/Centrality/influence_maximization/greedy/tg_algo_influence_maximization_greedy.yml
+1-1 b/‎algorithms/Centrality/influence_maximization/greedy/tg_algo_influence_maximization_greedy.yml
+1-1
diff --git a/‎algorithms/Centrality/influence_maximization/tg_sub_influence_maximization.yml
+1-1 b/‎algorithms/Centrality/influence_maximization/tg_sub_influence_maximization.yml
+1-1
diff --git a/‎algorithms/Centrality/pagerank/global/tg_sub_pagerank_global.yml
+1-1 b/‎algorithms/Centrality/pagerank/global/tg_sub_pagerank_global.yml
+1-1
diff --git a/‎algorithms/Centrality/pagerank/global/unweighted/tg_algo_pagerank.yml
+1-1 b/‎algorithms/Centrality/pagerank/global/unweighted/tg_algo_pagerank.yml
+1-1
diff --git a/‎algorithms/Centrality/pagerank/global/weighted/tg_algo_pagerank_wt.yml
+2-2 b/‎algorithms/Centrality/pagerank/global/weighted/tg_algo_pagerank_wt.yml
+2-2
diff --git a/‎algorithms/Centrality/pagerank/personalized/all_pairs/tg_algo_pagerank_pers_ap_batch.yml
+1-1 b/‎algorithms/Centrality/pagerank/personalized/all_pairs/tg_algo_pagerank_pers_ap_batch.yml
+1-1
diff --git a/‎algorithms/Centrality/pagerank/personalized/multi_source/tg_algo_pagerank_pers.yml
+1-1 b/‎algorithms/Centrality/pagerank/personalized/multi_source/tg_algo_pagerank_pers.yml
+1-1
diff --git a/‎algorithms/Centrality/pagerank/tg_sub_pagerank.yml
+2-1 b/‎algorithms/Centrality/pagerank/tg_sub_pagerank.yml
+2-1
diff --git a/‎algorithms/Centrality/tg_category_centrality.yml
+1-1 b/‎algorithms/Centrality/tg_category_centrality.yml
+1-1
diff --git a/‎algorithms/Classification/greedy_graph_coloring/tg_algo_greedy_graph_coloring.yml
+1-1 b/‎algorithms/Classification/greedy_graph_coloring/tg_algo_greedy_graph_coloring.yml
+1-1
diff --git a/‎algorithms/Classification/k_nearest_neighbors/all_pairs/tg_algo_knn_cosine_all.yml
+2-1 b/‎algorithms/Classification/k_nearest_neighbors/all_pairs/tg_algo_knn_cosine_all.yml
+2-1
diff --git a/‎algorithms/Classification/k_nearest_neighbors/cross_validation/tg_algo_knn_cosine_cv.yml
+2-1 b/‎algorithms/Classification/k_nearest_neighbors/cross_validation/tg_algo_knn_cosine_cv.yml
+2-1
diff --git a/‎algorithms/Classification/k_nearest_neighbors/single_source/tg_algo_knn_cosine_ss.yml
+2-1 b/‎algorithms/Classification/k_nearest_neighbors/single_source/tg_algo_knn_cosine_ss.yml
+2-1
diff --git a/‎algorithms/Classification/k_nearest_neighbors/tg_sub_k_nearest_neighbors.yml
+1-1 b/‎algorithms/Classification/k_nearest_neighbors/tg_sub_k_nearest_neighbors.yml
+1-1
diff --git a/‎algorithms/Classification/maximal_independent_set/deterministic/tg_algo_maximal_indep_set.yml
+1-1 b/‎algorithms/Classification/maximal_independent_set/deterministic/tg_algo_maximal_indep_set.yml
+1-1
@@ -10,7 +10,7 @@
     name: Article Rank
     filename: "tg_article_rank.gsql"
     sha_id: ed6ea869749977cc0f3df71225d7325fb81c9767
-    description: ArticleRank is an algorithm that has been derived from the PageRank algorithm to measure the influence of journal articles. PageRank assumes that relationships originating from low-degree nodes have a higher influence than relationships from high-degree nodes. Article Rank modifies the formula in such a way that it retains the basic PageRank methodology but lowers the influence of low-degree nodes.
+    description: "Measures the influence of vertices in a graph. ArticleRank retains the basic PageRank methodology but lowers the influence of low-degree nodes."
     schema_constraints: If you want to write the results of this algorithm (FLOAT) back to the vertices, you must have a FLOAT attribute on the target vertex type.
     version: lib3.0
     include: true
@@ -10,7 +10,7 @@
     name: Betweenness Centrality
     filename: "tg_betweenness_cent.gsql"
     sha_id: ed6ea869749977cc0f3df71225d7325fb81c9767
-    description: The Betweenness Centrality of a vertex is defined as the number of shortest paths that pass through this vertex, divided by the total number of shortest paths.
+    description: "Calculates the betweenness centrality of vertices in a graph."
     schema_constraints: If you want to write the results of this algorithm (FLOAT) back to the vertices, you must have a FLOAT attribute on the target vertex type.
     version: lib3.0
     include: true
@@ -10,6 +10,6 @@
     name: Approximate Closeness Centrality
     filename: "tg_closeness_cent_approx.gsql"
     sha_id: ed6ea869749977cc0f3df71225d7325fb81c9767
-    description: The Approximate Closeness Centrality algorithm (based on Cohen et al. 2014) calculates the approximate closeness centrality score for each vertex by combining two estimation approaches - sampling and pivoting. This hybrid estimation approach offers near-linear time processing and linear space overhead within a small relative error. It runs on graphs with unweighted edges (directed or undirected).
+    description: "Calculates the approximate closeness centrality score for each vertex. This algorithm offers near-linear time processing and linear space overhead within a small relative error."
     version: lib3.0
     include: true
@@ -10,7 +10,7 @@
     name: Closeness Centrality
     filename: "tg_closeness_cent.gsql"
     sha_id: ed6ea869749977cc0f3df71225d7325fb81c9767
-    description: TigerGraph’s closeness centrality algorithm uses multi-source breadth-first search (MS-BFS) to traverse the graph and calculate the sum of a vertex’s distance to every other vertex in the graph, which vastly improves the performance of the algorithm.
-    schema_constraints: If you want to write the results of this algorithm (FLOAT) back to the vertices, you must have a FLOAT attribute on the target vertex type.
+    description: "Calculates the exact closeness centrality of vertices in a graph. This algorithm might be time-consuming on large graphs when compared to the approximate version."
+    schema_constraints: If you want to write the results of this algorithm (FLOAT) back to the vertices, the target vertex type must have a FLOAT attribute.
     version: lib3.0
     include: true
@@ -1,2 +1,2 @@
 ---
-  description: The closeness centrality score is calculated as the inverse of the average of distances from each vertex to every other vertex in the graph. TigerGraph offers an exact and approximate version. 
+  description: "Calculates the closeness centrality of vertices in a graph. TigerGraph offers different algorithms that calculate approximate or exact closeness centrality."
@@ -10,7 +10,7 @@
     name: Degree Centrality
     filename: "tg_degree_cent.gsql"
     sha_id: ed6ea869749977cc0f3df71225d7325fb81c9767
-    description: Degree centrality is defined as the number of edges incident upon a node (i.e., the number of ties that a node has). The degree can be interpreted in terms of the immediate risk of a node for catching whatever is flowing through the network (such as a virus, or some information).
-    schema_constraints: If you want to write the results of this algorithm (FLOAT) back to the vertices, you must have a FLOAT attribute on the target vertex type.
+    description: "Calculates the degree centrality of vertices in a graph."
+    schema_constraints: If you want to write the results of this algorithm (FLOAT) back to the vertices, the target vertex type must have a FLOAT attribute.
     version: lib3.0
     include: true
@@ -10,7 +10,7 @@
     name: Eigenvector Centrality
     filename: "tg_eigenvector_cent.gsql"
     sha_id: ed6ea869749977cc0f3df71225d7325fb81c9767
-    description: Eigenvector centrality (also called eigencentrality or prestige score) is a measure of the influence of a vertex in a network. Relative scores are assigned to all vertices in the network based on the concept that connections to high-scoring vertices contribute more to the score of the vertex in question than equal connections to low-scoring vertices. A high eigenvector score means that a vertex is connected to many vertices who themselves have high scores.
-    schema_constraints: If you want to write the results of this algorithm (FLOAT) back to the vertices, you must have a FLOAT attribute on the target vertex type.
+    description: "Calculates the eigenvector centrality of vertices in a graph. A high eigenvector centrality score means that a vertex is connected to many vertices that themselves have high scores."
+    schema_constraints: If you want to write the results of this algorithm (FLOAT) back to the vertices, the target vertex type must have a FLOAT attribute.
     version: lib3.0
     include: true
@@ -10,7 +10,7 @@
     name: Harmonic Centrality
     filename: "tg_harmonic_cent.gsql"
     sha_id: ed6ea869749977cc0f3df71225d7325fb81c9767
-    description: The Harmonic Centrality algorithm calculates the harmonic centrality of each vertex in the graph. Harmonic Centrality is a variant of Closeness Centrality. In a (not necessarily connected) graph, the harmonic centrality reverses the sum and reciprocal operations in the definition of closeness centrality.
-    schema_constraints: If you want to write the results of this algorithm (FLOAT) back to the vertices, you must have a FLOAT attribute on the target vertex type.
+    description: "Calculates the harmonic centrality of each vertex in the graph. Harmonic centrality is a variant of closeness centrality."
+    schema_constraints: If you want to write the results of this algorithm (FLOAT) back to the vertices, the target vertex type must have a FLOAT attribute.
     version: lib3.0
     include: true
@@ -10,7 +10,7 @@
     name: Cost Effective Lazy Forward (CELF) Influence Maximization
     filename: "tg_influence_maximization_CELF.gsql"
     sha_id: ed6ea869749977cc0f3df71225d7325fb81c9767
-    description: Influence maximization is the problem of finding a small subset of vertices in a social network that could maximize the spread of influence. There are two versions of the Influence Maximization algorithm. Both versions find k vertices that maximize the expected spread of influence in the network. The CELF version improves upon the efficiency of the greedy version and should be preferred in analyzing large networks.
+    description: "This version is more efficient than the greedy version and should be preferred in analyzing large networks."
     schema_constraints: This algorithm also requires a FLOAT attribute on the target edge types representing weight or influence.
     version: lib3.0
     include: false
@@ -10,7 +10,7 @@
     name: Greedy Influence Maximization
     filename: "tg_influence_maximization_greedy.gsql"
     sha_id: ed6ea869749977cc0f3df71225d7325fb81c9767
-    description: Influence maximization is the problem of finding a small subset of vertices in a social network that could maximize the spread of influence. There are two versions of the Influence Maximization algorithm. Both versions find k vertices that maximize the expected spread of influence in the network.
+    description: "This version is more time-consuming than the CELF version."
     schema_constraints: This algorithm also requires a FLOAT attribute on the target edge types representing weight or influence.
     version: lib3.0
     include: false
@@ -1,2 +1,2 @@
 ---
-  description: The library is currently under construction! Descriptions will be added soon.
+  description: "Influence Maximization algorithms find a specified number of vertices that maximize the expected spread of influence in a network. The CELF version improves upon the efficiency of the greedy version and should be preferred in analyzing large networks."
@@ -1,2 +1,2 @@
 ---
-  description: The library is currently under construction! Descriptions will be added soon.
+  description: "In the global versions, the imaginary user can start browsing from any page as opposed to a specific set of pages."
@@ -10,7 +10,7 @@
     name: Pagerank
     filename: "tg_pagerank.gsql"
     sha_id: ed6ea869749977cc0f3df71225d7325fb81c9767
-    description: "The PageRank algorithm measures the influence of each vertex on every other vertex. PageRank influence is defined recursively: a vertex’s influence is based on the influence of the vertices which refer to it. A vertex’s influence tends to increase if (1) it has more referring vertices or if (2) its referring vertices have higher influence. The analogy to social influence is clear."
+    description: "Measures the influence of each vertex on every other vertex in a graph with unweighted edges."
     schema_constraints: If you want to write the results of this algorithm (FLOAT) back to the vertices, you must have a FLOAT attribute on the target vertex type.
     version: lib3.0
     include: true
@@ -10,7 +10,7 @@
     name: Weighted Pagerank
     filename: "tg_pagerank_wt.gsql"
     sha_id: ed6ea869749977cc0f3df71225d7325fb81c9767
-    description: "The PageRank algorithm measures the influence of each vertex on every other vertex. PageRank influence is defined recursively: a vertex’s influence is based on the influence of the vertices which refer to it. A vertex’s influence tends to increase if (1) it has more referring vertices or if (2) its referring vertices have higher influence. The analogy to social influence is clear. The only difference between weighted PageRank and standard PageRank is that edges have weights, and the influence that a vertex receives from an in-neighbor is multiplied by the weight of the in-edge."
-    schema_constraints: If you want to write the results of this algorithm (FLOAT) back to the vertices, you must have a FLOAT attribute on the target vertex type. This algorithm also requires a FLOAT attribute on the target edge types representing weight or influence.
+    description: "Measures the influence of each vertex on every other vertex in a graph with weighted edges. Multiplies a vertex's received influence by the weight of the in-edge."
+    schema_constraints: If you want to write the results of this algorithm (FLOAT) back to the vertices, the target vertex type must have a FLOAT attribute. This algorithm also requires a FLOAT attribute on the target edge types representing weight or influence.
     version: lib3.0
     include: true
@@ -10,6 +10,6 @@
     name: Personalized Pagerank (All Pairs, Batch)
     filename: "tg_pagerank_pers_ap_batch.gsql"
     sha_id: ed6ea869749977cc0f3df71225d7325fb81c9767
-    description: "The PageRank algorithm measures the influence of each vertex on every other vertex. PageRank influence is defined recursively: a vertex’s influence is based on the influence of the vertices which refer to it. A vertex’s influence tends to increase if (1) it has more referring vertices or if (2) its referring vertices have higher influence. The analogy to social influence is clear. In the original PageRank, the damping factor is the probability of the surfer continues browsing at each step. The surfer may also stop browsing and start again from a random vertex. In personalized PageRank, the surfer can only start browsing from a given set of source vertices both at the beginning and after stopping. "
+    description: "Calculates the personalized PageRank score starting from each vertex to every other vertex."
     version: lib3.0
     include: false
@@ -10,6 +10,6 @@
     name: Personalized Pagerank
     filename: "tg_pagerank_pers.gsql"
     sha_id: ed6ea869749977cc0f3df71225d7325fb81c9767
-    description: "The PageRank algorithm measures the influence of each vertex on every other vertex. PageRank influence is defined recursively: a vertex’s influence is based on the influence of the vertices which refer to it. A vertex’s influence tends to increase if (1) it has more referring vertices or if (2) its referring vertices have higher influence. The analogy to social influence is clear. In the original PageRank, the damping factor is the probability of the surfer continues browsing at each step. The surfer may also stop browsing and start again from a random vertex. In personalized PageRank, the surfer can only start browsing from a given set of source vertices both at the beginning and after stopping. "
+    description: "Calculates the personalized PageRank score starting from a specific set of source vertices."
     version: lib3.0
     include: false
@@ -1,2 +1,3 @@
 ---
-  description: The library is currently under construction! Descriptions will be added soon.
+  description: "Measures the influence of each vertex on every other vertex. 
+  PageRank influence is defined recursively: a vertex’s influence is based on the influence of the vertices which refer to it."
@@ -1,2 +1,2 @@
 ---
-  description: Centrality algorithms calculate the 'importance' of each vertex given a particular metric. These metrics generally revolve around density of a vertex's connectivity or the importance of that vertex to the general connectivity of the entire graph. Some widely used examples include Betweenness Centrality, which produces scores for vertices based on the number of shortest paths that they appear in and Closeness Centrality, which measures importance inversely proportional to how 'far' the vertex is away from every other vertex.
+  description: "Centrality algorithms calculate the 'importance' of each vertex given a particular metric. These metrics generally revolve around density of a vertex's connectivity or the importance of that vertex to the general connectivity of the entire graph. Some widely used examples include Betweenness Centrality, which produces scores for vertices based on the number of shortest paths that they appear in and Closeness Centrality, which measures importance inversely proportional to how 'far' the vertex is away from every other vertex."
@@ -10,6 +10,6 @@
     name: Greedy Graph Coloring
     filename: "tg_greedy_graph_coloring.gsql"
     sha_id: ed6ea869749977cc0f3df71225d7325fb81c9767
-    description: This algorithm assigns a unique integer value known as its color to the vertices of a graph such that no neighboring vertices share the same color. The reason why this is called color is that this task is equivalent to assigning a color to each nation on a map so that no neighboring nations share the same color.
+    description: "Assigns a unique integer value, known as 'color', to the vertices of a graph such that no neighboring vertices share the same color."
     version: lib3.0
     include: false
@@ -10,7 +10,8 @@
     name: K Nearest Neighbors (All Pairs)
     filename: "tg_knn_cosine_all.gsql"
     sha_id: ed6ea869749977cc0f3df71225d7325fb81c9767
-    description: The k-Nearest Neighbors (kNN) algorithm is one of the simplest classification algorithms. It assumes that some or all the vertices in the graph have already been classified. The classification is stored as an attribute called the label. The goal is to predict the label of a given vertex, by seeing what are the labels of the nearest vertices. This algorithm is a batch version of the k-Nearest Neighbors, Cosine Neighbor Similarity, single vertex. It makes a prediction for every vertex whose label is not known (i.e., the attribute for the known label is empty), based on its k nearest neighbors' labels.
+    description: "This algorithm makes a prediction for every vertex whose label is not known based on its k nearest neighbors' labels."
+    schema_constraints: "This algorithm requires a FLOAT attribute on the target edge types representing weight, and a STRING attribute representing the label."
     version: lib3.0
     include: false
     dependencies:
 
@@ -10,7 +10,8 @@
     name: K Nearest Neighbors (Cross Validation)
     filename: "tg_knn_cosine_cv.gsql"
     sha_id: ed6ea869749977cc0f3df71225d7325fb81c9767
-    description: k-Nearest Neighbors (kNN) is often used for machine learning. You can choose the value for topK based on your experience, or using cross-validation to optimize the hyperparameters. In our library, Leave-one-out cross-validation for selecting optimal k is provided. Given a k value, we run the algorithm repeatedly using every vertex with a known label as the source vertex and predict its label. We assess the accuracy of the predictions for each value of k, and then repeat for different values of k in the given range. The goal is to find the value of k with highest predicting accuracy in the given range, for that dataset.
+    description: "This algorithm runs the single source version repeatedly using every vertex with a known label as the source vertex and predicts its label. It assesses the accuracy of the predictions for each value of k, and then repeats for different values of k in the given range. The goal is to find the value of k with the highest prediction accuracy in the given range, for that dataset."
+    schema_constraints: "This algorithm requires a FLOAT attribute on the target edge types representing weight, and a STRING attribute representing the label."
     version: lib3.0
     include: false
     dependencies:
 
@@ -10,6 +10,7 @@
     name: K Nearest Neighbors (Single Source)
     filename: "tg_knn_cosine_ss.gsql"
     sha_id: ed6ea869749977cc0f3df71225d7325fb81c9767
-    description: The library is currently under construction! Descriptions will be added soon.
+    description: "This algorithm calculates the distance between a single source vertex and all other vertices and selects the k vertices that are nearest."
+    schema_constraints: "This algorithm requires a FLOAT attribute on the target edge types representing weight, and a STRING attribute representing the label."
     version: lib3.0
     include: false
@@ -1,2 +1,2 @@
 ---
-  description: The library is currently under construction! Descriptions will be added soon.
+  description: "Predicts the label of a given vertex based on the labels of its nearest vertices. The label is a vertex attribute that stores the classification of a vertex. This algorithm assumes that the vertices have already been classified."
@@ -10,6 +10,6 @@
     name: Maximal Independent Set (Deterministic)
     filename: "tg_maximal_indep_set.gsql"
     sha_id: ed6ea869749977cc0f3df71225d7325fb81c9767
-    description: "An independent set of vertices does not contain any pair of vertices that are neighbors, i.e., ones which have an edge between them. A maximal independent set (MIS) is the largest independent set that contains those vertices; you cannot improve upon it unless you start over with a different independent set. However, the search for the largest possible independent set is an NP-hard problem: there is no known algorithm that can find that answer in polynomial time. So we settle for the maximal independent set. The deterministic version makes sure that you get the same results every time."
+    description: "The deterministic version of the MIS algorithm returns the same results every time it runs."
     version: lib3.0
     include: true
Original file line number	Diff line number	Diff line change
`@@ -1,2 +1,2 @@`
`1`	`1`	`---`
`2`		`- description: The closeness centrality score is calculated as the inverse of the average of distances from each vertex to every other vertex in the graph. TigerGraph offers an exact and approximate version.`
	`2`	`+ description: "Calculates the closeness centrality of vertices in a graph. TigerGraph offers different algorithms that calculate approximate or exact closeness centrality."`
Original file line number	Diff line number	Diff line change
`@@ -1,2 +1,2 @@`
`1`	`1`	`---`
`2`		`- description: The library is currently under construction! Descriptions will be added soon.`
	`2`	`+ description: "Influence Maximization algorithms find a specified number of vertices that maximize the expected spread of influence in a network. The CELF version improves upon the efficiency of the greedy version and should be preferred in analyzing large networks."`
Original file line number	Diff line number	Diff line change
`@@ -1,2 +1,2 @@`
`1`	`1`	`---`
`2`		`- description: Centrality algorithms calculate the 'importance' of each vertex given a particular metric. These metrics generally revolve around density of a vertex's connectivity or the importance of that vertex to the general connectivity of the entire graph. Some widely used examples include Betweenness Centrality, which produces scores for vertices based on the number of shortest paths that they appear in and Closeness Centrality, which measures importance inversely proportional to how 'far' the vertex is away from every other vertex.`
	`2`	`+ description: "Centrality algorithms calculate the 'importance' of each vertex given a particular metric. These metrics generally revolve around density of a vertex's connectivity or the importance of that vertex to the general connectivity of the entire graph. Some widely used examples include Betweenness Centrality, which produces scores for vertices based on the number of shortest paths that they appear in and Closeness Centrality, which measures importance inversely proportional to how 'far' the vertex is away from every other vertex."`