Merge branch 'v3.007-dev-new' into HEAD

* v3.007-dev-new: (246 commits) Taskable: Fixes compilation for Taskable.test.mq4 Std: Uses Alert() and DebugBreak() for MQL only Workaround for closing order conditions after orders are loaded from active pool (GH-705) Trade: TradeParams: Adds max_spread Order: Fixes the current volume value when data in orequest is missing Order: Refresh order after modification Trade: Disables filling modes for MQL4 Account/AccountMt: Fixes zero division Refs EA31337-classes/EA31337-indicators-other#13, EA31337-classes/EA31337-indicators-other#15. WIP. TDI-RT-Clone and Heiken_Ashi_Smoothed indicators made to work in MT5. GHA: Compile: Adds support for path input ACQUIRE_BUFFERn / RELEASE_BUFFERn functionality required for EA31337/EA31337-indicators-stats#1 SerializerConverter: Fixes error: member reference base type 'C *' is not a structure Fixes nullptr undeclared identifier Minor fixes C++ compatibility fixes. Account/AccountMt: Fixes zero division GHA: Compile: Support for workflow calls GHA: Compile: Skips clean-up by default GHA: Fixes compilation workflows Trade: Disables filling modes for MQL4 ...
EA31337 · May 1, 2024 · 979924a · 979924a
1 parent 5e14147
commit 979924a
Show file tree

Hide file tree

Showing 11 changed files with 980 additions and 186 deletions.
diff --git a/Array.mqh b/Array.mqh
@@ -772,7 +772,7 @@ template <typename X>
 
 template <typename X>
 void ArrayPush(ARRAY_REF(X, array), X value) {
-  ArrayResize(Array::ArraySize(array) + 1);
+  ArrayResize(array, ArraySize(array) + 1);
   array[ArraySize(array) - 1] = value;
 }
 template <typename X>

diff --git a/Indicator.struct.h b/Indicator.struct.h
@@ -152,7 +152,7 @@ struct IndicatorParams {
   }
   void SetMaxParams(int _value) {
     max_params = _value;
-    ArrayResize(input_params, max_params);
+    ArrayResize(input_params, (int)max_params);
   }
   void SetName(string _name) { name = _name; };
   void SetShift(int _shift) { shift = _shift; }

diff --git a/Indicators/Account/tests/Indi_AccountStats.test.mq5 b/Indicators/Account/tests/Indi_AccountStats.test.mq5
@@ -58,4 +58,4 @@ void OnTick() {
       assertTrueOrExit(_entry.IsValid(), "Invalid entry!");
     }
   }
-}
+}
diff --git a/Matrix.matmul.cl b/Matrix.matmul.cl
@@ -0,0 +1,115 @@
+#define WIDTH 1
+#define TSM 128                // The tile-size in dimension M
+#define TSN 128                // The tile-size in dimension N
+#define TSK 16                 // The tile-size in dimension K
+#define WPTM 8                 // The work-per-thread in dimension M
+#define WPTN 8                 // The work-per-thread in dimension N
+#define RTSM (TSM/WPTM)        // The reduced tile-size in dimension M
+#define RTSN (TSN/WPTN)        // The reduced tile-size in dimension N
+#define LPTA ((TSK*TSM)/(RTSM*RTSN)) // Loads-per-thread for A
+#define LPTB ((TSK*TSN)/(RTSM*RTSN)) // Loads-per-thread for B
+__kernel void matmul(const int M, const int N, const int K,
+                      const __global double* A,
+                      const __global double* B,
+                      __global float* C) {
+
+    // Thread identifiers
+    const int tidm = get_local_id(0); // Local row ID (max: TSM/WPTM)
+    const int tidn = get_local_id(1); // Local col ID (max: TSN/WPTN)
+    const int offsetM = TSM*get_group_id(0); // Work-group offset
+    const int offsetN = TSN*get_group_id(1); // Work-group offset
+
+    // Local memory to fit a tile of A and B
+    __local float Asub[TSK][TSM];
+    __local float Bsub[TSK][TSN];
+
+    // Allocate register space
+    float Areg;
+    float Breg[WPTN];
+    float acc[WPTM][WPTN];
+
+    // Initialise the accumulation registers
+    for (int wm=0; wm<WPTM; wm++) {
+        for (int wn=0; wn<WPTN; wn++) {
+            acc[wm][wn] = 0.0f;
+        }
+    }
+
+    // Loop over all tiles
+    int numTiles = K/TSK;
+    for (int t=0; t<numTiles; t++) {
+
+        // Load one tile of A and B into local memory
+        for (int la=0; la<LPTA/WIDTH; la++) {
+            int tid = tidn*RTSM + tidm;
+            int id = la*RTSN*RTSM + tid;
+            int row = id % (TSM/WIDTH);
+            int col = id / (TSM/WIDTH);
+
+            // Load the values (wide vector load)
+            int tiledIndex = TSK*t + col;
+            double vecA = A[tiledIndex*(M/WIDTH) + offsetM/WIDTH + row];
+            double vecB = B[tiledIndex*(N/WIDTH) + offsetN/WIDTH + row];
+
+            // Store the loaded vectors into local memory
+            #if WIDTH == 1
+                Asub[col][row] = vecA;
+                Asub[col][row] = vecA;
+            #elif WIDTH == 2
+                Asub[col][WIDTH*row + 0] = vecA.x;
+                Asub[col][WIDTH*row + 1] = vecA.y;
+            #elif WIDTH == 4
+                Asub[col][WIDTH*row + 0] = vecA.x;
+                Asub[col][WIDTH*row + 1] = vecA.y;
+                Asub[col][WIDTH*row + 2] = vecA.z;
+                Asub[col][WIDTH*row + 3] = vecA.w;
+            #endif
+            #if WIDTH == 1
+                Bsub[col][row] = vecB;
+                Bsub[col][row] = vecB;
+            #elif WIDTH == 2
+                Bsub[col][WIDTH*row + 0] = vecB.x;
+                Bsub[col][WIDTH*row + 1] = vecB.y;
+            #elif WIDTH == 4
+                Bsub[col][WIDTH*row + 0] = vecB.x;
+                Bsub[col][WIDTH*row + 1] = vecB.y;
+                Bsub[col][WIDTH*row + 2] = vecB.z;
+                Bsub[col][WIDTH*row + 3] = vecB.w;
+            #endif
+        }
+
+        // Synchronise to make sure the tile is loaded
+        barrier(CLK_LOCAL_MEM_FENCE);
+
+        // Loop over the values of a single tile
+        for (int k=0; k<TSK; k++) {
+
+            // Cache the values of Bsub in registers
+            for (int wn=0; wn<WPTN; wn++) {
+                int col = tidn + wn*RTSN;
+                Breg[wn] = Bsub[k][col];
+            }
+
+            // Perform the computation
+            for (int wm=0; wm<WPTM; wm++) {
+                int row = tidm + wm*RTSM;
+                Areg = Asub[k][row];
+                for (int wn=0; wn<WPTN; wn++) {
+                    acc[wm][wn] += Areg * Breg[wn];
+                }
+            }
+        }
+
+        // Synchronise before loading the next tile
+        barrier(CLK_LOCAL_MEM_FENCE);
+    }
+
+    // Store the final results in C
+    for (int wm=0; wm<WPTM; wm++) {
+        int globalRow = offsetM + tidm + wm*RTSM;
+        for (int wn=0; wn<WPTN; wn++) {
+            int globalCol = offsetN + tidn + wn*RTSN;
+            C[globalCol*M + globalRow] = acc[wm][wn];
+        }
+    }
+}
diff --git a/Matrix.matmul.naive.cl b/Matrix.matmul.naive.cl
@@ -0,0 +1,14 @@
+#pragma OPENCL EXTENSION cl_khr_fp64 : enable
+
+__kernel void matmul(__global double* A, __global double* B, __global double* C, int rowsA, int colsA, int colsB) {
+  int i = get_global_id(0);
+  int j = get_global_id(1);
+
+  if (i < rowsA && j < colsB) {
+    float sum = 0.0f;
+    for (int k = 0; k < colsA; ++k) {
+      sum += A[i * colsA + k] * B[k * colsB + j];
+    }
+    C[i * colsB + j] = sum;
+  }
+}
diff --git a/Matrix.matmul.test.cl b/Matrix.matmul.test.cl
@@ -0,0 +1,19 @@
+#pragma OPENCL EXTENSION cl_khr_fp64 : enable
+__kernel void matmul(const int M, const int N, const int K,
+                      const __global double* A,
+                      const __global double* B,
+                      __global double* C) {
+
+    // Thread identifiers
+    //const int globalRow = get_global_id(0); // Row ID of C (0..M)
+    //const int globalCol = get_global_id(1); // Col ID of C (0..N)
+
+    // Compute a single element (loop over K)
+    //float acc = 0.0f;
+    //for (int k=0; k<K; k++) {
+        //acc += A[k*M + globalRow] * B[globalCol*K + k];
+    //}
+
+    // Store the result
+    //C[globalCol*M + globalRow] = acc;
+}
-Original file line number
+Diff line change
@@ Expand Up / @@ -58,4 +58,4 @@ void OnTick() { @@
           assertTrueOrExit(_entry.IsValid(), "Invalid entry!");
         }
       }
-    }
+    }