From db1bc7ff11bd12784ba486b936ff93fb61e76210 Mon Sep 17 00:00:00 2001
From: AbsoluteVacuum <32832158+AbsoluteVacuum@users.noreply.github.com>
Date: Fri, 27 Oct 2023 12:49:15 +0300
Subject: [PATCH 1/2] Update ovftools.py

_fast_binary_decode cleanup, readout shape correction and improvement
_text_decode cleanup, improvement and speedup
---
 mx3tools/ovftools.py | 58 +++++++++++++++-----------------------------
 1 file changed, 20 insertions(+), 38 deletions(-)

diff --git a/mx3tools/ovftools.py b/mx3tools/ovftools.py
index 96afb16..7c830bf 100644
--- a/mx3tools/ovftools.py
+++ b/mx3tools/ovftools.py
@@ -5,6 +5,12 @@
 #
 # The _fast_binary_decode function uses numpy's ndarray constructor to eliminate the need for loops, dramatically
 # reducing the time needed to move the data read from the file object into an array (~100x speedup).
+# 
+# The _text_decode function uses numpy's loadtxt to eliminate the need for loops.
+# Also, it now supports scalar text data.
+# 
+# unpack() works on both text and binary formats (prefer binary: it is much lighter)
+# unpack() works on both scalar and vector data (output shape is always [znodes, ynodes, xnodes, valuedim])
 
 import re
 import numpy as np
@@ -89,6 +95,7 @@ def _read_header(fobj):
                     "xnodes",
                     "ynodes",
                     "znodes",
+                    "valuedim",
                     "valuemultiplier"]:
             if key in line:
                 headers[key] = float(line.split(': ')[1])
@@ -144,42 +151,27 @@ def _binary_decode(f, chunk_size, decoder, headers, dtype):
 
 
 def _text_decode(f, headers):
-
-    data = np.empty((int(headers['znodes']),
-                     int(headers['ynodes']),
-                     int(headers['xnodes']), 3), dtype=float)
-
-    for k in range(data.shape[0]):
-        for j in range(data.shape[1]):
-            for i in range(data.shape[2]):
-                text = f.readline().strip().split()
-                data[k, j, i] = (float(text[0]), float(text[1]), float(text[2]))
+    """Parse the text data block of f into an array shaped [znodes, ynodes, xnodes, valuedim]."""
+    # OVF 1.0 headers carry no valuedim (their data is always 3-vectors), so fall back to 3.
+    arrshape = [int(headers[key]) for key in ('znodes', 'ynodes', 'xnodes')] + [int(headers.get('valuedim', 3))]
+    data = np.loadtxt(f, max_rows=int(np.prod(arrshape[:3]))).reshape(arrshape)
 
     return data*headers.get('valuemultiplier', 1)
 
 
 def _fast_binary_decode(f, chunk_size, headers, dtype):
 
-    xs, ys, zs = (int(headers['xnodes']), int(headers['ynodes']), int(headers['znodes']))
-    ret = np.ndarray(shape=(xs*ys*zs, 3),
+    """Read f's binary data block as a [znodes, ynodes, xnodes, valuedim] array; valuedim defaults to 3 (OVF 1.0)."""
+    arrshape = [int(headers[key]) for key in ('znodes', 'ynodes', 'xnodes')] + [int(headers.get('valuedim', 3))]
+    ret = np.ndarray(shape=arrshape,
                      dtype=dtype,
-                     buffer=f.read(xs*ys*zs*3*chunk_size),
-                     offset=0,
-                     strides=(3*chunk_size, chunk_size))
-
-    return ret.reshape((zs, ys, xs, 3))
+                     buffer=f.read(int(np.prod(arrshape))*chunk_size),
+                     offset=0)
+    return ret
 
 
 def _fast_binary_decode_scalars(f, chunk_size, headers, dtype):
-
-    xs, ys, zs = (int(headers['xnodes']), int(headers['ynodes']), int(headers['znodes']))
-    ret = np.ndarray(shape=(xs*ys*zs, 1),
-                     dtype=dtype,
-                     buffer=f.read(xs*ys*zs*chunk_size),
-                     offset=0,
-                     strides=(chunk_size, chunk_size))
-
-    return ret.reshape((zs, ys, xs))
+    return _fast_binary_decode(f, chunk_size, headers, dtype)[..., 0]  # keep component 0 of the last (valuedim) axis
 
 
 def group_unpack(path, pattern='m'):
@@ -225,18 +217,8 @@ def group_unpack(path, pattern='m'):
 
 
 def unpack_scalars(path):
-    path = ioutil.pathize(path)
-
-    with path.open('rb') as f:
-        headers = _read_header(f)
-
-        if headers['data_type'][3] == 'Binary':
-            chunk_size = int(headers['data_type'][4])
-            return _fast_binary_decode_scalars(f, chunk_size, headers, _endianness(f, chunk_size))
-
-        else:
-            raise NotImplementedError
-
+    return unpack(path)[..., 0]  # keep component 0 of the last (valuedim) axis returned by unpack()
+
 
 def as_rodrigues(path, fname):
     """For each m*.ovf file in the given directory, generate a corresponding .csv containing the indices, rotation

From 2d5b494e0fafc41b30a60f78df6b326a7173519b Mon Sep 17 00:00:00 2001
From: AbsoluteVacuum <32832158+AbsoluteVacuum@users.noreply.github.com>
Date: Sun, 24 Dec 2023 00:27:41 +0200
Subject: [PATCH 2/2] import-only version of ovftools.py

works on both text and binary formats (prefer binary: it is much lighter)
works on both scalar and vector data (output shape is always [znodes, ynodes, xnodes, valuedim])

How to use:
place this file in your working folder and use "from mx3import import unpack"
and then call unpack("mumax-generated-file.ovf")
---
 mx3tools/mx3import.py | 140 ++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 140 insertions(+)
 create mode 100644 mx3tools/mx3import.py

diff --git a/mx3tools/mx3import.py b/mx3tools/mx3import.py
new file mode 100644
index 0000000..4715cb1
--- /dev/null
+++ b/mx3tools/mx3import.py
@@ -0,0 +1,140 @@
+# This code is based on oommfdecode.py by Duncan Parkes:
+# https://github.com/deparkes/OOMMFTools/blob/master/oommftools/core/oommfdecode.py
+# and also ovftools.py by Peyton Murray
+# https://github.com/peytondmurray/mx3tools/blob/master/mx3tools/ovftools.py
+#
+# How to use: 
+# place this file in your working folder and use "from mx3import import unpack"
+# and then use unpack("mumax-generated-file.ovf")
+#
+# works on both text and binary formats (prefer binary: it is much lighter)
+# works on both scalar and vector data (output shape is always [znodes, ynodes, xnodes, valuedim])
+
+import numpy as np
+import struct
+import pathlib
+
+def pathize(path):
+    """Return path as a pathlib object, building one from a str when necessary.
+
+    Parameters
+    ----------
+    path : str or pathlib.Path
+        Path to normalise
+
+    Returns
+    -------
+    pathlib.Path
+        A new pathlib.Path for str input; pathlib objects are returned unchanged.
+        Any other input type raises TypeError.
+    """
+
+    if isinstance(path, pathlib.PurePath):
+        return path
+    if isinstance(path, str):
+        return pathlib.Path(path)
+    raise TypeError(f'Invalid path type: {type(path)}')
+
+
+def unpack(path):
+    """Read the OVF file at path into an array shaped [znodes, ynodes, xnodes, valuedim]."""
+    path = pathize(path)
+    with path.open('rb') as f:
+        headers = _read_header(f)
+        data_format = headers['data_type'][3]  # 4th token of the 'Begin: Data ...' line
+        if data_format == 'Text':
+            return _text_decode(f, headers)
+        if data_format == 'Binary':
+            chunk_size = int(headers['data_type'][4])
+            return _fast_binary_decode(f, chunk_size, headers, _endianness(f, chunk_size))
+        raise ValueError(f'Unsupported OVF data format: {data_format!r}')  # was a silent None
+
+
+def _read_header(fobj):
+    """Read headers from OVF file object. fobj must be opened in 'rb' mode (read as bytes).
+
+    Parameters
+    ----------
+    fobj : file
+        OVF file to read, must be opened in bytes mode (mode='rb')
+
+    Returns
+    -------
+    dict
+        Dictionary containing the [important] header keys and values
+
+    Raises
+    ------
+    IOError
+        If the file ends before a 'Begin: Data' line is found
+    """
+
+    headers = {'SimTime': -1, 'Iteration': -1, 'Stage': -1, 'MIFSource': ''}
+    numeric_keys = ("xbase", "ybase", "zbase",
+                    "xstepsize", "ystepsize", "zstepsize",
+                    "xnodes", "ynodes", "znodes",
+                    "valuemultiplier", "valuedim")
+
+    line = ''
+    while 'Begin: Data' not in line:
+        raw = fobj.readline()
+        if not raw:  # EOF: without this check a truncated or non-OVF file would loop forever
+            raise IOError("Reached end of file before 'Begin: Data'")
+        line = raw.strip().decode()
+
+        # Numeric fields are matched by substring and parsed from the text after ': '.
+        for key in numeric_keys:
+            if key in line:
+                headers[key] = float(line.split(': ')[1])
+
+        # Optional metadata; the defaults set above are kept when a line is absent.
+        if 'Total simulation time' in line:
+            headers['SimTime'] = float(line.split(':')[-1].strip().split()[0].strip())
+        elif 'Iteration' in line:
+            headers['Iteration'] = float(line.split(':')[2].split(',')[0].strip())
+        elif 'MIF source file' in line:
+            headers['MIFSource'] = line.split(':', 2)[2].strip()
+
+    # The loop exits on the 'Begin: Data' line; keep its whitespace-split tokens for the caller.
+    headers['data_type'] = line.split()
+
+    return headers
+
+
+def _byte_decoder(endianness):  # wrap the given struct format string in a reusable struct.Struct
+    return struct.Struct(endianness)
+
+
+def _endianness(f, nbytes):
+    """Read the nbytes-wide check value from f and return the struct format ('>f', '<d', ...) that decodes it."""
+    buffer = f.read(nbytes)
+    big_endian = {4: '>f', 8: '>d'}
+    little_endian = {4: '<f', 8: '<d'}
+    value = {4: 1234567.0, 8: 123456789012345.0}
+
+    if struct.unpack(big_endian[nbytes], buffer)[0] == value[nbytes]:       # Big endian?
+        return big_endian[nbytes]
+    elif struct.unpack(little_endian[nbytes], buffer)[0] == value[nbytes]:  # Little endian?
+        return little_endian[nbytes]
+    else:
+        raise IOError(f'Cannot decode {nbytes}-byte order mark: ' + buffer.hex())  # hex(bytes) raised TypeError
+
+def _text_decode(f, headers):
+    """Parse the text data block of f into an array shaped [znodes, ynodes, xnodes, valuedim]."""
+    # OVF 1.0 headers carry no valuedim (their data is always 3-vectors), so fall back to 3.
+    arrshape = [int(headers[key]) for key in ('znodes', 'ynodes', 'xnodes')] + [int(headers.get('valuedim', 3))]
+    data = np.loadtxt(f, max_rows=int(np.prod(arrshape[:3]))).reshape(arrshape)
+
+    return data*headers.get('valuemultiplier', 1)
+
+
+def _fast_binary_decode(f, chunk_size, headers, dtype):
+    """Read the binary data block of f into an array shaped [znodes, ynodes, xnodes, valuedim]."""
+    # OVF 1.0 headers carry no valuedim (their data is always 3-vectors), so fall back to 3.
+    arrshape = [int(headers[key]) for key in ('znodes', 'ynodes', 'xnodes')] + [int(headers.get('valuedim', 3))]
+    ret = np.ndarray(shape=arrshape,
+                     dtype=dtype,
+                     buffer=f.read(int(np.prod(arrshape))*chunk_size),
+                     offset=0)
+
+    return ret