VariantSync
diff --git a/docker/entrypoint.sh b/docker/entrypoint.sh
Lines changed: 6 additions & 6 deletions
diff --git a/docker/fix-perms.sh b/docker/fix-perms.sh
Lines changed: 9 additions & 9 deletions
diff --git a/docs/replication/create-forks-on-github.sh b/docs/replication/create-forks-on-github.sh
Lines changed: 37 additions & 37 deletions
diff --git a/linegraph/createGraph.py b/linegraph/createGraph.py
Lines changed: 13 additions & 13 deletions
diff --git a/linegraph/graphGeneration.py b/linegraph/graphGeneration.py
Lines changed: 1 addition & 1 deletion
diff --git a/linegraph/lattice/.gitignore b/linegraph/lattice/.gitignore
Lines changed: 1 addition & 1 deletion
diff --git a/linegraph/renderMultilinemacros.sh b/linegraph/renderMultilinemacros.sh
Lines changed: 1 addition & 1 deletion
diff --git a/linegraph/renderPatterns.sh b/linegraph/renderPatterns.sh
Lines changed: 1 addition & 1 deletion
diff --git a/mining/bisect_threshold_search.py b/mining/bisect_threshold_search.py
Lines changed: 25 additions & 25 deletions
@@ -1,9 +1,9 @@
 #!/bin/sh
 if [ "$(id -u)" = "0" ]; then
-  # running on a developer laptop as root
-  fix-perms -r -u user -g user /home/user
-  exec gosu user "$@"
+    # running on a developer laptop as root
+    fix-perms -r -u user -g user /home/user
+    exec gosu user "$@"
 else
-  # running in production as a user
-  exec "$@"
-fi
+    # running in production as a user
+    exec "$@"
+fi
@@ -1,12 +1,12 @@
 # update the uid
 if [ -n "$opt_u" ]; then
-  OLD_UID=$(getent passwd "${opt_u}" | cut -f3 -d:)
-  NEW_UID=$(stat -c "%u" "$1")
-  if [ "$OLD_UID" != "$NEW_UID" ]; then
-    echo "Changing UID of $opt_u from $OLD_UID to $NEW_UID"
-    usermod -u "$NEW_UID" -o "$opt_u"
-    if [ -n "$opt_r" ]; then
-      find / -xdev -user "$OLD_UID" -exec chown -h "$opt_u" {} \;
+    OLD_UID=$(getent passwd "${opt_u}" | cut -f3 -d:)
+    NEW_UID=$(stat -c "%u" "$1")
+    if [ "$OLD_UID" != "$NEW_UID" ]; then
+        echo "Changing UID of $opt_u from $OLD_UID to $NEW_UID"
+        usermod -u "$NEW_UID" -o "$opt_u"
+        if [ -n "$opt_r" ]; then
+            find / -xdev -user "$OLD_UID" -exec chown -h "$opt_u" {} \;
+        fi
     fi
-  fi
-fi
+fi
@@ -10,22 +10,22 @@ DRY_RUN=n
 #DRY_RUN=n
 
 continue-with() {
-  echo
-  read -p "Do you want to continue with $1? [y/N] " answer
-  [ "$answer" == "y" ]
+    echo
+    read -p "Do you want to continue with $1? [y/N] " answer
+    [ "$answer" == "y" ]
 }
 
 run() {
-  echo
-  echo "\$ $*"
-  if [ "$DRY_RUN" = "n" ]
-  then
-    "$@"
-  fi
+    echo
+    echo "\$ $*"
+    if [ "$DRY_RUN" = "n" ]
+    then
+        "$@"
+    fi
 }
 
 repos() {
-  find "$PATH_TO_REPOSITORIES" -mindepth 1 -maxdepth 1 -type d "$@"
+    find "$PATH_TO_REPOSITORIES" -mindepth 1 -maxdepth 1 -type d "$@"
 }
 
 PATH_TO_REPOSITORIES="$(realpath "$PATH_TO_REPOSITORIES")"
@@ -36,49 +36,49 @@ continue-with "these $(repos -print0 | tr -d -c '\0' | tr '\0' '\n' | wc -l) rep
 
 if gh auth status |& grep -q 'You are not logged into any GitHub hosts.' &>/dev/null
 then
-  run gh auth login || exit 1
-  was_logged_in=0
+    run gh auth login || exit 1
+    was_logged_in=0
 else
-  echo
-  gh auth status
+    echo
+    gh auth status
 
-  continue-with "this account" ||
-  {
-    run gh auth logout &&
-    run gh auth login || exit 1
-  }
-  was_logged_in=1
+    continue-with "this account" ||
+    {
+        run gh auth logout &&
+        run gh auth login || exit 1
+    }
+    was_logged_in=1
 fi
 
 repos -print0 |
 while IFS= read -d '' -r repository
 do
-  echo
-  run cd "$repository"
-  url="$(git remote get-url origin)"
-  if [[ "$url" =~ github.com ]]
-  then
-    echo "$repository is a github repo"
-    run gh repo fork --remote || echo "already forked"
-    run git push -f origin
-  else
-    echo "$repository is not a github repo"
-    run git remote rename origin upstream &>/dev/null
-    run gh repo create "DiffDetective/$(basename "$repository")" -d "Fork of $url" --push --public --source .
-  fi
-  echo "repo succesful"
+    echo
+    run cd "$repository"
+    url="$(git remote get-url origin)"
+    if [[ "$url" =~ github.com ]]
+    then
+        echo "$repository is a github repo"
+        run gh repo fork --remote || echo "already forked"
+        run git push -f origin
+    else
+        echo "$repository is not a github repo"
+        run git remote rename origin upstream &>/dev/null
+        run gh repo create "DiffDetective/$(basename "$repository")" -d "Fork of $url" --push --public --source .
+    fi
+    echo "repo succesful"
 done
 
 if [ "$was_logged_in" = "1" ]
 then
-  cat <<EOF
+    cat <<EOF
 
 Warning: 'gh' is still logged in, to log out use
 
     gh auth logout
 
 EOF
 else
-  echo
-  run gh auth logout
+    echo
+    run gh auth logout
 fi
@@ -12,7 +12,7 @@
 # Add arguments, such as
 #     --patterns_path     path to the patterns file (default: ../lattice/patterns.lg)
 #     --lattice_path      path to the lattice file (default: ../lattice/lattice.lg)
-#     --node_parser       (default|patternsdebug|patternsrelease) 
+#     --node_parser       (default|patternsdebug|patternsrelease)
 #                         how the node labels in the patterns file should be interpreted
 ####################################################################
 
@@ -81,26 +81,26 @@ def patterns(patterns_file_path):
     for line in patternLines:
         line = line.replace("\n", "")
         line = line.replace("\r", "")
-        
+
         if line.startswith("t"):
             # save previous read tree
             if len(nodes):
                 trees.update({tree : (nodes.copy(), edges.copy())})
                 drawCluster(tree, nodes, edges)
-            
+
             # read new tree (and clear all nodes and edges)
             nodes.clear()
             edges.clear()
             # t # TREE_ID
             lineParams = line.split(" ")
             tree = lineParams[2]
-            
+
         # read in node
         elif line.startswith("v"):
             # v ID LABEL
             lineParams = line.split(" ")
             nodes.append((lineParams[1], ' '.join(lineParams[2:])))
-        
+
         # read in edge
         elif line.startswith("e"):
             # e NODE_CHILD_ID NODE_PARENT_ID LABEL
@@ -123,17 +123,17 @@ def lattice(lattice_file_path):
     for line in latticeLines:
         line = line.replace("\n", "")
         line = line.replace("\r", "")
-        
+
         if line.startswith("t"):
             # t # TREE_ID
             pass
-        
+
         elif line.startswith("v"):
             # v ID LABEL
             lineParams = line.split(" ")
             latticeNodes.update({lineParams[1]: lineParams[2]})
 
-            
+
         elif line.startswith("e"):
             # e NODE_CHILD_ID NODE_PARENT_ID LABEL
             lineParams = line.split(" ")
@@ -152,10 +152,10 @@ def main():
     argparser.add_argument('--lattice_path', nargs='?', default="../lattice/lattice.lg", type=str)
     argparser.add_argument('--node_parser', nargs='?', default="patternsrelease", type=str)
     args = argparser.parse_args()
-    
+
     patterns_path = args.patterns_path
     lattice_path = args.lattice_path
-    
+
     # select the node parser
     global NODE_PARSER # accessing the gloabl variable NODE_PARSER
     if args.node_parser == "default":
@@ -170,12 +170,12 @@ def main():
     #d.attr(rankdir='LR')
     d.attr(overlap='false')
     #d.attr(compound='true')
-    
+
     d.attr(sep = "+10")
-    
+
     patterns(patterns_path)
     lattice(lattice_path)
-    
+
     d.view()
 
 
 
@@ -237,4 +237,4 @@ def edgeColour(edge):
     elif edge.startswith("b"):
         return EDGE_REM_COLOR
     else:
-        raise Exception("Cannot parse edge label " + edge)
+        raise Exception("Cannot parse edge label " + edge)
@@ -1 +1 @@
-*.gv 
+*.gv
@@ -1,2 +1,2 @@
 # Run in project root
-.venv/bin/python3 linegraph/renderLinegraph.py "src/test/resources/multilinemacros/gen"
+.venv/bin/python3 linegraph/renderLinegraph.py "src/test/resources/multilinemacros/gen"
@@ -1,2 +1,2 @@
 #!/usr/bin/env bash
-python3 renderLinegraph.py --pattern --atomics --fontsize 7 "/mnt/c/Users/Paul Bittner/Documents/MyDocuments/Paper/Notes/Papers/VariabilityEditPatternMining/Results/Patterns/$1"
+python3 renderLinegraph.py --pattern --atomics --fontsize 7 "/mnt/c/Users/Paul Bittner/Documents/MyDocuments/Paper/Notes/Papers/VariabilityEditPatternMining/Results/Patterns/$1"
@@ -15,46 +15,46 @@ def bisect_threshold(lib_path, data_path, target_count=500):
     The input directory should contain the graph database as .lg file, the number of graphs in the file as .count file.
     It is assumed, that the count files are enumerated the same way as the graph databases, so that a lexicographic sorting gives matching files.'''
     target_count = int(target_count)
-    
+
     # First check, that we have as many count-files as graph files.
     db_files = sorted([file_name for file_name in os.listdir(data_path) if file_name.endswith('.aids')])
     count_files = sorted([file_name for file_name in os.listdir(data_path) if file_name.endswith('.count')])
     assert len(db_files) == len(count_files)
-    
-    
+
+
     for idx, in_file in enumerate(db_files):
         match_filename = re.match(regex_count_file, in_file)
-        
+
         if not match_filename:
             assert False, "Filename for db_size not formatted as expected."
-        
-        
+
+
         database_id = int(match_filename.group(1))
-        
-        
+
+
         t_max = get_db_size(data_path + count_files[idx])
         t_min = 2
-        
+
         # Bisection to find a heuristically good threshold
         while t_max - t_min > 1:
             t = (t_max + t_min) // 2
             found_patterns = run_approximate(lib_path, data_path + in_file, data_path + 'frequent_temp.cstring', t)
-            
+
             if found_patterns >= target_count:
-                t_min = t	
+                t_min = t
             else:
                 t_max = t
-                
+
 
         # Write found threshold to file
         with open(data_path +  str(database_id) + '.threshold', 'w') as f:
-            f.write(str(t))   
-       
-    
+            f.write(str(t))
+
+
 def get_db_size(file_name):
     with open(file_name) as f:
         return int(f.read())
-    
+
 def count_subgraphs(subgraph_file):
     ''' Assume a AIDS format. In this format, every graph is represented by 3 lines.'''
     i = None
@@ -65,34 +65,34 @@ def count_subgraphs(subgraph_file):
         return ceil((i + 1) / 3)
     else:
         return 0
-    
+
 def run_approximate(lib_path, input_file, output_file, threshold):
     ''' We fix the maximum length to l, i.e., we are mining patterns at most l nodes large. '''
-    
+
     # Run HOPS approximate subgraph miner
     lwg_cmd_template = "'{lib_path}lwg' -t {threshold} -p 8 -e hops -i 5 '{input_file}' -o '{output_file}'"
     miner_cmd = lwg_cmd_template.format(lib_path=lib_path, input_file=input_file, output_file=output_file, threshold=threshold)
-        
+
     p = subprocess.Popen(miner_cmd, shell=True)
-       
+
     try:
         p.wait(30)  # Should take at most 30 seconds
     except Exception as e:
         print(str(e))
-        p.kill()    
-        
+        p.kill()
+
     # transform output file (so that we can easier count the number of patterns later
     cstring_cmd = "cat " + output_file + " | xargs -I {} bash -c \"echo '{}' | '" + lib_path + "cstring' -i -\"  > " + output_file + ".tmp"
-    
+
     subprocess.run(cstring_cmd, shell = True)
 
     #os.remove(output_file)
     nb_subgraphs = count_subgraphs(output_file+".tmp")
     #os.remove(output_file+".tmp")
     return nb_subgraphs
-    
+
 if __name__ == "__main__":
     if len(sys.argv) == 4:
-        bisect_threshold(sys.argv[1], sys.argv[2], target_count = sys.argv[3])	
+        bisect_threshold(sys.argv[1], sys.argv[2], target_count = sys.argv[3])
     else:
         print("Unexpected number of arguments. Run as python bisect_threshold_search.py [lib_path] [data_path] [target_count]. lwg and cstring tool binaries need to be located in the lib_path. Data directiory is expected to contain .lg line graph databases and .count files with the number of graphs in the corresponding database.")
Original file line number	Diff line number	Diff line change
`@@ -1,2 +1,2 @@`
`1`	`1`	`# Run in project root`
`2`		`-.venv/bin/python3 linegraph/renderLinegraph.py "src/test/resources/multilinemacros/gen"`
	`2`	`+.venv/bin/python3 linegraph/renderLinegraph.py "src/test/resources/multilinemacros/gen"`
Original file line number	Diff line number	Diff line change
`@@ -1,2 +1,2 @@`
`1`	`1`	`#!/usr/bin/env bash`
`2`		`-python3 renderLinegraph.py --pattern --atomics --fontsize 7 "/mnt/c/Users/Paul Bittner/Documents/MyDocuments/Paper/Notes/Papers/VariabilityEditPatternMining/Results/Patterns/$1"`
	`2`	`+python3 renderLinegraph.py --pattern --atomics --fontsize 7 "/mnt/c/Users/Paul Bittner/Documents/MyDocuments/Paper/Notes/Papers/VariabilityEditPatternMining/Results/Patterns/$1"`