Update ACE run-experiments.jl and documentation.

emmanuellujan · emmanuellujan · commit 088ad5df5719 · 2022-08-25T22:25:49.000-04:00
diff --git a/docs/src/index.md b/docs/src/index.md
@@ -77,12 +77,12 @@ The input parameters are listed below:
 
 | Input parameter      | Description                                               | E.g.                |
 |----------------------|-----------------------------------------------------------|---------------------|
-| experiment_path      | Experiment path                                           | TiO2/               |
+| experiment_path      | Experiment path                                           | HfB2/               |
 | dataset_path         | Dataset path                                              | data/               |
-| trainingset_filename | Training datasets filename                                | TiO2trainingset.xyz |
-| testset_filename     | Test datasets filename                                    | TiO2testset.xyz     |
-| n_train_sys          | No. of atomic configurations in training dataset          | 80                  |
-| n_test_sys           | No. of atomic configurations in test dataset              | 20                  |
+| dataset_filename     | Dataset filename                                          | HfB2-n24-585.exyz   |
+| split_prop           | Split proportion. E.g. 0.8 training, 0.2 test.            | 0.8                 |
+| max_train_sys        | Max. no. of atomic systems in training dataset            | 800                 |
+| max_test_sys         | Max. no. of atomic systems in test dataset                | 200                 |
 | n_body               | Body order                                                | 3                   |
 | max_deg              | Maximum polynomial degree                                 | 3                   |
 | r0                   | An estimate on the nearest-neighbour distance for scaling | 1.0                 |
@@ -92,29 +92,30 @@ The input parameters are listed below:
 | w_e                  | Energy weight                                             | 1.0                 |
 | w_f                  | Force weight                                              | 1.0                 |
 
+
 Run fitting process
 
 ```shell
-    $ julia fit-ace.jl  experiment_path         TiO2/ \
-                        dataset_path            data/ \
-                        trainingset_filename    TiO2trainingset.xyz \
-                        testset_filename        TiO2testset.xyz \
-                        n_train_sys             80 \
-                        n_test_sys              20 \
-                        n_body                  3 \
-                        max_deg                 3 \
-                        r0                      1.0 \
-                        rcutoff                 5.0 \
-                        wL                      1.0 \
-                        csp                     1.0 \
-                        w_e                     1.0 \
-                        w_f                     1.0
+    $ julia --project=../../   fit-ace.jl   experiment_path       HfB2/ \
+                                            dataset_path          ../../../data/ \
+                                            dataset_filename      HfB2-n24-585.exyz \
+                                            split_prop            0.8 \
+                                            max_train_sys         800 \
+                                            max_test_sys          200 \
+                                            n_body                3 \
+                                            max_deg               3 \
+                                            r0                    1.0 \
+                                            rcutoff               5.0 \
+                                            wL                    1.0 \
+                                            csp                   1.0 \
+                                            w_e                   1.0 \
+                                            w_f                   1.0
 ```
 
 In addition, you can run the experiments with the default parameters (the parameters shown above).
 
 ```shell
-    $ julia fit-ace.jl
+    $ julia --project=../../ fit-ace.jl
 ```
 
 ### Run multiple fitting experiments in serial/parallel using the wrapper to ACE1.jl in InteratomicBasisPotentials.jl
@@ -134,7 +135,7 @@ Modify the file `run-experiments.jl` to specify the parameter ranges needed to g
 Run the script:
 
 ```shell
-    $ julia run-experiments.jl
+    $ julia --project=../../ run-experiments.jl
 ```
 
 Each experiment is run in a separate process (using `nohup` to facilitate its execution in a cluster).
@@ -148,11 +149,11 @@ After all experiments have been completed, run the following script to gather th
 ### Run an MD simulation using the wrapper to Molly.jl or NBodySimulator.jl in Atomistic.jl
 
 ```shell
-    $ run-md-ahfo2-ace-nbs.jl
+    $ julia --project=../../ run-md-ahfo2-ace-nbs.jl
 ```
 or
 ```shell
-    $ run-md-ahfo2-ace-molly.jl
+    $ julia --project=../../ run-md-ahfo2-ace-molly.jl
 ```
 (Note: currently there is a bug in the second script) 
 
@@ -166,21 +167,21 @@ or
 
 Open terminal and download Julia from https://julialang.org/downloads/
 ```shell
-    $ wget https://julialang-s3.julialang.org/bin/linux/x64/1.7/julia-1.7.3-linux-x86_64.tar.gz
+    $ wget https://julialang-s3.julialang.org/bin/linux/x64/1.8/julia-1.8.0-linux-x86_64.tar.gz
 ```
 Extract file
 ```shell
-    $ tar xvzf julia-1.7.3-linux-x86_64.tar.gz
+    $ tar xvzf julia-1.8.0-linux-x86_64.tar.gz
 ```
 Copy to `/opt` and create link
 ```shell
-    $ sudo mv  ./julia-1.7.3 /opt/
-    $ sudo ln -s /opt/julia-1.7.3/bin/julia /usr/local/bin/julia
+    $ sudo mv  ./julia-1.8.0 /opt/
+    $ sudo ln -s /opt/julia-1.8.0/bin/julia /usr/local/bin/julia
 ```
 Alternative: add line to `.shellrc`
 ```shell
     $ nano .shellrc
-    PATH=$PATH:/home/youruser/julia-1.7.3 /bin/
+    PATH=$PATH:/home/youruser/julia-1.8.0/bin/
 ```
 Restart the terminal
 
@@ -204,4 +205,4 @@ Activate and instantiate
 ```julia
     pkg> activate .
     pkg> instantiate
-```
+```
diff --git a/workflows/ACE/fit-ace.jl b/workflows/ACE/fit-ace.jl
@@ -6,7 +6,7 @@ using LinearAlgebra
 
 
 # Load input parameters
-args = ["experiment_path",      "HfB2-33/",
+args = ["experiment_path",      "HfB2/",
         "dataset_path",         "../../../data/",
         "dataset_filename",     "HfB2-n24-585.exyz",
         "split_prop",           "0.8", # 80% training, 20% test.
diff --git a/workflows/ACE/run-experiments.jl b/workflows/ACE/run-experiments.jl
@@ -1,7 +1,7 @@
 # Run multiple fitting experiments in serial or parallel.
 #
 # 1. Update parameters ranges in run-experiments.jl
-# 2. Run: $ julia run-experiments.jl
+# 2. Run: $ julia --project=../../ run-experiments.jl
 # 3. After all experiments have been completed, run the following script to gather
 #    the results into a single csv: $ ./gather-results.sh
 #
@@ -11,11 +11,10 @@ using IterTools
 # Parameter labels
 labels = [  "experiment_path",
             "dataset_path",
-            "trainingset_filename",
-            "testset_filename",
-            "n_train_sys",
-            "n_test_sys",
-            "n_batches",
+            "dataset_filename",
+            "split_prop",
+            "max_train_sys",
+            "max_test_sys",
             "n_body",
             "max_deg",
             "r0",
@@ -25,9 +24,8 @@ labels = [  "experiment_path",
             "w_e",
             "w_f"]
 
-
 # Parallel execution. Warning: a high number of parallel experiments may degrade system performance.
-parallel = false
+parallel = true
 
 # Experiment folder
 experiments_path = "experiments/"
@@ -38,25 +36,27 @@ juliafile = "fit-ace.jl"
 # Parameter definitions ########################################################
 
 # dataset path
-dataset_path = ["../data/"]
+dataset_path = ["../../../data/"]
+
+# dataset filename
+dataset_filename = [ "HfB2-n24-585.exyz",
+                     "HfO2_cpmd_1000.xyz",
+                     "HfO2_cpmd_train_0_94_11_7700.xyz",
+                     "HfO2_relax_1000_989.xyz" ]
 
-# datasets filename
-trainingset_filename = ["TiO2trainingset.xyz"]
-testset_filename = ["TiO2testset.xyz"]
+# Split proportion
+split_prop = 0.8:0.8
 
 # number of atomic configurations
-#n_systems = 100:100
-n_train_sys = 80:80
-n_test_sys = 20:20
+max_train_sys = 800:800
+max_test_sys = 200:200
 
-# number of batches per dataset
-n_batches = 8:8
 
 # n_body: body order. N: correlation order (N = n_body - 1)
-n_body = 2:5
+n_body = 2:2
 
 # max_deg: maximum polynomial degree
-max_deg = 3:6
+max_deg = 3:3
 
 # r0: An estimate on the nearest-neighbour distance for scaling, JuLIP.rnn() 
 #     function returns element specific earest-neighbour distance
@@ -66,43 +66,42 @@ r0 = 1.0:1.0 # ( rnn(:Hf) + rnn(:O) ) / 2.0 ?
 # rin = 0.65*r0 is the default
 
 # rcutoff or rcut: outer cutoff radius
-rcutoff = 4.0:7.0
+rcutoff = 5.0:5.0
 
 # D: specifies the notion of polynomial degree for which there is no canonical
 #    definition in the multivariate setting. Here we use SparsePSHDegree which
 #    specifies a general class of sparse basis sets; see its documentation for
 #    more details. Default: D = ACE1.SparsePSHDegree(; wL = rpi.wL, csp = rpi.csp)
 # wL: ?
-wL = 0.5:0.5:1.5
+wL = 1.0:1.0
 # csp: ?
-csp = 0.5:0.5:1.5
+csp = 1.0:1.0
 
 # pin: specifies the behaviour of the basis as the inner cutoff radius.
 # pin = 0 is the default.
 
 # w_e: energy weight, used during fitting in normal equations
-w_e = [1e-8, 1.0, 100.0]
+w_e = 1.0:1.0
 
 # w_f: force weight, used during fitting in normal equations
-w_f = [1e-8, 1.0, 100.0]
+w_f = 1.0:1.0
 
 
 # Run experiments ##############################################################
 
-run(`mkdir $experiments_path`)
-for params in product(dataset_path, trainingset_filename, testset_filename,
-                      n_train_sys, n_test_sys, n_batches,
-                      n_body, max_deg, r0, rcutoff, wL, csp, w_e, w_f)
+run(`mkdir -p $experiments_path`)
+for params in product( dataset_path, dataset_filename, split_prop, max_train_sys,
+                       max_test_sys, n_body, max_deg, r0, rcutoff, wL, csp, w_e, w_f)
     print("Launching experiment with parameters: ")
     currexp_path = reduce(*,map(s->"$s"*"-", params[2:end]))[1:end-1]
     params = vcat(["$(labels[1])", "$experiments_path$currexp_path/"],
                    vcat([ ["$l", "$p"] for (l, p) in zip(labels[2:end], params)]...))
     println("$params")
     
     if parallel
-        @async run(Cmd(`nohup julia $juliafile $params`, dir="./"));
+        @async run(Cmd(`nohup julia --project=../../ $juliafile $params`, dir="./"));
     else
-        run(Cmd(`julia $juliafile $params`, dir="./"));
+        run(Cmd(`julia --project=../../ $juliafile $params`, dir="./"));
     end
 
     println("")
diff --git a/workflows/NeuralACE-experimental/run-experiments.jl b/workflows/NeuralACE-experimental/run-experiments.jl
@@ -1,7 +1,7 @@
 # Run multiple fitting experiments in serial or parallel.
 #
 # 1. Update parameters ranges in run-experiments.jl
-# 2. Run: $ julia run-experiments.jl
+# 2. Run: $ julia --project=../../ run-experiments.jl
 # 3. After all experiments have been completed, run the following script to gather
 #    the results into a single csv: $ ./gather-results.sh
 #
@@ -41,10 +41,13 @@ juliafile = "fit-neural-ace.jl"
 # Parameter definitions ########################################################
 
 # dataset path
-dataset_path = ["../../data/"]
+dataset_path = ["../../../data/"]
 
 # dataset filename
-dataset_filename = ["HfB2-n24-585.exyz"]
+dataset_filename = [ "HfO2_cpmd_1000.xyz", 
+                     "HfO2_cpmd_train_0_94_11_7700.xyz",
+                     "HfO2_relax_1000_989.xyz", 
+                     "HfB2-n24-585.exyz"]
 
 # Split proportoin
 split_prop = 0.8:0.8
@@ -63,7 +66,7 @@ n_batches = 1:1
 optimiser = ["BFGS"]
 
 # Max. no. of optimizer iterations
-max_it = 70:70
+max_it = 100:100
 
 # n_body: body order. N: correlation order (N = n_body - 1)
 n_body = 2:2