PinguDevTeam · dorukaks · Nov 29, 2022 · Nov 29, 2022 · Nov 29, 2022 · Nov 29, 2022
diff --git a/compressionPipeline.py b/compressionPipeline.py
@@ -0,0 +1,103 @@
+import os
+import time
+
+import numpy as np
+import TTICE as ttice
+
+method = "ttsvd"
+heuristics = ["skip", "occupancy"]
+occThreshold = 1
+compMetrFile = "compressionMetrics.txt"  # This file is for me
+lines2Print = []
+"""
+Don't modify those 3 lines above; they are settings for the compression algorithm.
+"""
+
+cwd = os.getcwd()
+epsilon = 0.05  # This is the relative approximation error threshold
+nTrainingRuns = 640  # Modify this number accordingly
+stpIdx = (
+    300  # If you downsample before saving data, change this to an appropriate number
+)
+step = 10  # If you downsample before saving data, change this to 1
+iterStep = 1
+
+dataDir = "./"  # Folder where the 2048x1528x3x300 numpy arrays are stored
+# I suggest putting all the training runs in one folder
+saveDir = "./"  # Folder where you will save the TT-cores
+saveName = "trainedCore"  # Name of the saved TT-core files
+dataName = "run_"  # I assumed that you name all the run files "run_<runIdx>"
+
+"""
+Pick one of the two loops below and proceed
+"""
+# OPTION 1
+# If you use the following loop, keep all the training runs in one place
+for runIdx in os.listdir():
+    data = np.load(dataDir + runIdx, mmap_mode="r")
+# OPTION 2
+# If you use the following loop, name the training runs with consecutive
+#  numbers starting from 0
+for runIdx in range(nTrainingRuns):
+    print(f"Run: {runIdx}")
+    data = np.load(dataDir + dataName + f"{runIdx}", mmap_mode="r")
+
+    # After you pick one of the loops above, comment the other.
+    # The rest should be in the same loop since we are compressing.
+
+    stIdx = 0
+    if runIdx == 0:
+        # I'm checking here if we are at the first run. Please modify this if
+        # statement accordingly
+        dataSet = ttice.ttObject(
+            data[:, :, :, stIdx][:, :, :, None],
+            epsilon=epsilon,
+            keepData=False,
+            samplesAlongLastDimension=True,
+            method=method,
+        )
+        dataSet.changeShape([16, 32, 32, 191, 3, 1])
+        dataSet.ttDecomp()
+        lines2Print.append(f"{0}")
+        lines2Print.append(f"{dataSet.compressionTime}")
+        lines2Print.append(f"{dataSet.compressionRatio}")
+        lines2Print.append(" ".join(map(str, dataSet.ttRanks)))
+        lines2Print.append("\n")
+
+        # If you end up downsampling the timesteps before saving the data, change
+        # this to 1
+        stIdx = 9
+    else:
+        stIdx = 0
+
+    for iterIdx in range(stIdx, stpIdx, step):
+        stTime = time.time()
+        streamedTensor = data[:, :, :, iterIdx][:, :, :, None].reshape(
+            dataSet.reshapedShape[:-1] + [-1]
+        )
+        dataSet.ttICEstar(
+            streamedTensor,
+            epsilon=epsilon,
+            heuristicsToUse=heuristics,
+            occupancyThreshold=occThreshold,
+        )
+        stepTime = time.time() - stTime
+        lines2Print.append(f"{iterStep}")
+        lines2Print.append(f"{stepTime}")
+        lines2Print.append(f"{dataSet.compressionRatio}")
+        lines2Print.append(" ".join(map(str, dataSet.ttRanks)))
+        lines2Print.append("\n")
+        print(
+            f"Run {runIdx} timestep {iterIdx} (overall: {iterStep})\
+                done in {round(stepTime,4)}s"
+        )
+        with open(compMetrFile, "a") as txt:
+            txt.writelines(" ".join(lines2Print))
+        lines2Print = []
+        iterStep += 1
+    """
+    I'm saving after each simulation here. It will slow down compression a little
+    bit, but it will save us a lot of valuable time if compression fails prematurely
+    for some reason
+    """
+    dataSet.saveData(saveName, directory=saveDir, justCores=True, outputType="npy")
diff --git a/src/TTICE/__init__.py b/src/TTICE/__init__.py
@@ -1,11 +1,12 @@
-def testFcn(a):
-    """This is a test function to check if docstrings are working
+"""
+Welcome to TTICE documentation!
 
-    Args:
-        a (float): random value
+This python package currently offers support for multidimensional tensors
+in Tensor-Train format. We use the TT-SVD algorithm proposed by Ivan Oseledets
+and TT-ICE algorithm proposed by Doruk Aksoy.
 
-    Returns:
-        (float): input plus 2
-    """
-    a += 2
-    return a
+In future releases, the coverage may be extended to other tensor decomposition formats
+such as CP and/or Tucker.
+"""
+
+from .ttObject import ttObject  # noqa: F401
diff --git a/src/TTICE/template_TT_ICE_documentation.py → src/TTICE/test_TTICE_documentation.py b/src/TTICE/template_TT_ICE_documentation.py → src/TTICE/test_TTICE_documentation.py
@@ -20,10 +20,14 @@ def templateFunction(arg1, arg2):
     return m
 
 
-def main():
-    """This is the main function (TT-ICE)"""
-    print(templateFunction(1, 2))
-
-
-if __name__ == "__main__":
-    main()
+class main:
+    def __init__(
+        self,
+        data,
+        epsilon: float = None,
+        keepData: bool = False,
+        samplesAlongLastDimension: bool = True,
+        method: str = "ttsvd",
+    ):
+        """This is the main function (TTICE)"""
+        print(templateFunction(1, 2))
diff --git a/src/TTICE/TTICE.rst → src/TTICE/trial123.rst b/src/TTICE/TTICE.rst → src/TTICE/trial123.rst