xtaci · springfieldking · Apr 18, 2022 · springfieldking · Apr 27, 2022 · springfieldking
diff --git a/fec.cpp b/fec.cpp
@@ -2,12 +2,9 @@
 // Created by 理 傅 on 2017/1/2.
 //
 
-#include <err.h>
-#include <sys/time.h>
 #include <iostream>
 #include <stdexcept>
 #include "fec.h"
-#include "sess.h"
 #include "encoding.h"
 
 FEC::FEC(ReedSolomon enc) :enc(enc) {}
@@ -33,13 +30,11 @@ FEC::New(int rxlimit, int dataShards, int parityShards)  {
 }
 
 fecPacket
-FEC::Decode(byte *data, size_t sz) {
+FEC::Decode(byte *data, size_t sz, uint32_t ts) {
     fecPacket pkt;
     data = decode32u(data, &pkt.seqid);
     data = decode16u(data, &pkt.flag);
-    struct timeval time;
-    gettimeofday(&time, NULL);
-    pkt.ts = uint32_t(time.tv_sec * 1000 + time.tv_usec/1000);
+    pkt.ts = ts;
     pkt.data = std::make_shared<std::vector<byte>>(data, data+sz - fecHeaderSize);
     return pkt;
 }
@@ -62,11 +57,8 @@ FEC::MarkFEC(byte *data) {
     }
 }
 
-std::vector<row_type>
-FEC::Input(fecPacket &pkt) {
-    std::vector<row_type> recovered;
-
-    uint32_t now = currentMs();
+void
+FEC::Input(fecPacket &pkt, uint32_t now, std::vector<row_type>& recovered) {
     if (now-lastCheck >= fecExpire) {
         for (auto it = rx.begin();it !=rx.end();) {
             if (now - it->ts > fecExpire) {
@@ -78,13 +70,12 @@ FEC::Input(fecPacket &pkt) {
         lastCheck = now;
     }
 
-
     // insertion
     auto n = this->rx.size() -1;
     int insertIdx = 0;
     for (int i=n;i>=0;i--) {
         if (pkt.seqid == rx[i].seqid) {
-            return recovered;
+            return;
         } else if (pkt.seqid > rx[i].seqid) {
             insertIdx = i + 1;
             break;
@@ -113,10 +104,10 @@ FEC::Input(fecPacket &pkt) {
         int numDataShard = 0;
         int first = 0;
         size_t maxlen = 0;
-
-        std::vector<row_type> shardVec(totalShards);
-        std::vector<bool> shardflag(totalShards, false);
-
+        static thread_local std::vector<row_type> shardVec;  // per-thread scratch, reused across calls
+        static thread_local std::vector<bool> shardflag;     // constructed once per thread, so not sized here
+        shardVec.assign(totalShards, nullptr);  // size AND reset each call: totalShards may differ between calls
+        shardflag.assign(totalShards, false);
         for (auto i = searchBegin; i <= searchEnd; i++) {
             auto seqid = rx[i].seqid;
             if (seqid > shardEnd) {
@@ -163,7 +154,7 @@ FEC::Input(fecPacket &pkt) {
         rx.erase(rx.begin());
     }
 
-    return recovered;
+    return;
 }
 
 

diff --git a/fec.h b/fec.h
@@ -35,13 +35,13 @@ class FEC {
     inline bool isEnabled() { return dataShards > 0 && parityShards > 0 ; }
 
     // Input a FEC packet, and return recovered data if possible.
-    std::vector<row_type> Input(fecPacket &pkt);
+    void Input(fecPacket &pkt, uint32_t now, std::vector<row_type>& recovered);
 
     // Calc Parity Shards
     void Encode(std::vector<row_type> &shards);
 
     // Decode a raw array into fecPacket
-    static fecPacket Decode(byte *data, size_t sz);
+    static fecPacket Decode(byte *data, size_t sz,  uint32_t ts);
 
     // Mark raw array as typeData, and write correct size.
     void MarkData(byte *data, uint16_t sz);

diff --git a/fec_test.cpp b/fec_test.cpp
@@ -61,7 +61,8 @@ int main() {
         } else {
             pkt.flag = typeFEC;
         }
-        auto recovered = fec.Input(pkt);
+        std::vector<row_type> recovered;
+        fec.Input(pkt, 0, recovered);
 
         if (recovered.size() > 0) {
             std::cout << "recovered:" << std::endl;

diff --git a/galois_noasm.cpp b/galois_noasm.cpp
@@ -3,18 +3,17 @@
 //
 
 #include "galois_noasm.h"
-#include "matrix.h"
 
 extern const byte mulTable[256][256];
 
-void galMulSlice(byte c, row_type in, row_type out) {
-    for (int n=0;n<in->size();n++) {
-        (*out)[n] = mulTable[c][(*in)[n]];
-    }
+void galMulSlice(byte c, byte* in, byte* out, int size) {
+  // Look up row c of mulTable once, then map every input byte through it.
+  const byte* row = mulTable[c];
+  for (int n = 0; n < size; n++) out[n] = row[in[n]];
 }
 
-void galMulSliceXor(byte c, row_type in, row_type out) {
-    for (int n=0;n<in->size();n++) {
-        (*out)[n] ^= mulTable[c][(*in)[n]];
-    }
-}
+void galMulSliceXor(byte c, byte* in, byte* out, int size) {
+  // XOR the row-c table lookup of each input byte into the matching output byte.
+  const byte* row = mulTable[c];
+  for (int n = 0; n < size; n++) out[n] ^= row[in[n]];
+}
diff --git a/galois_noasm.h b/galois_noasm.h
@@ -6,13 +6,12 @@
 #define KCP_GALOIS_NOASM_H
 
 #include "galois.h"
-#include "matrix.h"
 
 #ifdef __cplusplus
 extern "C" {
 #endif
-void galMulSlice(byte c,  row_type in, row_type out);
-void galMulSliceXor(byte c, row_type in, row_type out);
+void galMulSlice(byte c,  byte* in, byte* out, int size);
+void galMulSliceXor(byte c, byte* in, byte* out, int size);
 
 #ifdef __cplusplus
 }

diff --git a/inversion_tree.cpp b/inversion_tree.cpp
@@ -8,65 +8,65 @@
 inversionTree inversionTree::newInversionTree(int dataShards, int parityShards) {
     inversionTree tree;
     tree.m_root.m_children.resize(dataShards + parityShards, nullptr);
-    tree.m_root.m_matrix = matrix::identityMatrix(dataShards);
+    tree.m_root.m_matrix = std::make_shared<IdentityMatrix>(dataShards);
     return tree;
 }
 
 
-matrix
+MatrixPtr
 inversionTree::GetInvertedMatrix(std::vector<int> &invalidIndices) {
     if (invalidIndices.size() == 0) {
         return m_root.m_matrix;
     }
 
-    return m_root.getInvertedMatrix(invalidIndices, 0);
+    return m_root.getInvertedMatrix(invalidIndices, 0, 0);
 }
 
 int
-inversionTree::InsertInvertedMatrix(std::vector<int> &invalidIndices, matrix &matrix, int shards) {
+inversionTree::InsertInvertedMatrix(std::vector<int> &invalidIndices, MatrixPtr &matrix, int shards) {
     // If no invalid indices were given then we are done because the
     // m_root node is already set with the identity matrix.
     if (invalidIndices.size() == 0) {
         return -1;
     }
 
-    if (!matrix.IsSquare()) {
+    if (!matrix->IsSquare()) {
         return -2;
     }
 
     // Recursively create nodes for the inverted matrix in the tree until
     // we reach the node to insert the matrix to.  We start by passing in
     // 0 as the parent index as we start at the m_root of the tree.
-    m_root.insertInvertedMatrix(invalidIndices, matrix, shards, 0);
+    m_root.insertInvertedMatrix(invalidIndices, 0, matrix, shards, 0);
 
     return 0;
 }
 
-matrix
-inversionNode::getInvertedMatrix(std::vector<int> &invalidIndices, int parent) {
+MatrixPtr
+inversionNode::getInvertedMatrix(const std::vector<int> &invalidIndices, int index, int parent) {
     // Get the child node to search next from the list of m_children.  The
     // list of m_children starts relative to the parent index passed in
     // because the indices of invalid rows is sorted (by default).  As we
     // search recursively, the first invalid index gets popped off the list,
     // so when searching through the list of m_children, use that first invalid
     // index to find the child node.
-    int firstIndex = invalidIndices[0];
+    int firstIndex = invalidIndices[index];
     auto node = m_children[firstIndex - parent];
 
     // If the child node doesn't exist in the list yet, fail fast by
     // returning, so we can construct and insert the proper inverted matrix.
     if (node == nullptr) {
-        return matrix{};
+        return nullptr;
     }
 
     // If there's more than one invalid index left in the list we should
     // keep searching recursively.
-    if (invalidIndices.size() > 1) {
+    if (invalidIndices.size() - index> 1) {
         // Search recursively on the child node by passing in the invalid indices
         // with the first index popped off the front.  Also the parent index to
         // pass down is the first index plus one.
-        std::vector<int> v(invalidIndices.begin() + 1, invalidIndices.end());
-        return node->getInvertedMatrix(v, firstIndex + 1);
+        // Advance `index` rather than copying the tail of invalidIndices into a new vector.
+        return node->getInvertedMatrix(invalidIndices, index + 1, firstIndex + 1);
     }
 
     // If there aren't any more invalid indices to search, we've found our
@@ -79,8 +79,9 @@ inversionNode::getInvertedMatrix(std::vector<int> &invalidIndices, int parent) {
 
 void
 inversionNode::insertInvertedMatrix(
-        std::vector<int> &invalidIndices,
-        struct matrix &matrix,
+        const std::vector<int> &invalidIndices,
+        int index,
+        MatrixPtr &matrix,
         int shards,
         int parent) {
     // As above, get the child node to search next from the list of m_children.
@@ -89,7 +90,7 @@ inversionNode::insertInvertedMatrix(
     // search recursively, the first invalid index gets popped off the list,
     // so when searching through the list of m_children, use that first invalid
     // index to find the child node.
-    int firstIndex = invalidIndices[0];
+    int firstIndex = invalidIndices[index];
     auto node = m_children[firstIndex - parent];
 
     // If the child node doesn't exist in the list yet, create a new
@@ -109,13 +110,13 @@ inversionNode::insertInvertedMatrix(
     // If there's more than one invalid index left in the list we should
     // keep searching recursively in order to find the node to add our
     // matrix.
-    if (invalidIndices.size() > 1) {
+    if (invalidIndices.size() - index > 1) {
         // As above, search recursively on the child node by passing in
         // the invalid indices with the first index popped off the front.
         // Also the total number of shards and parent index are passed down
         // which is equal to the first index plus one.
-        std::vector<int> v(invalidIndices.begin() + 1, invalidIndices.end());
-        node->insertInvertedMatrix(v, matrix, shards, firstIndex + 1);
+        // Advance `index` rather than copying the tail of invalidIndices into a new vector.
+        node->insertInvertedMatrix(invalidIndices, index + 1, matrix, shards, firstIndex + 1);
     } else {
         node->m_matrix = matrix;
     }

diff --git a/inversion_tree.h b/inversion_tree.h
@@ -9,11 +9,11 @@
 #include "matrix.h"
 
 struct inversionNode {
-    struct matrix m_matrix;
+    MatrixPtr m_matrix;
     std::vector<std::shared_ptr<inversionNode>> m_children;
-    struct matrix getInvertedMatrix(std::vector<int> & invalidIndices, int parent);
+    MatrixPtr getInvertedMatrix(const std::vector<int> & invalidIndices, int index, int parent);
 
-    void insertInvertedMatrix(std::vector<int> &invalidIndices, struct matrix &matrix, int shards, int parent);
+    void insertInvertedMatrix(const std::vector<int> &invalidIndices, int index, MatrixPtr &matrix, int shards, int parent);
 };
 
 class inversionTree {
@@ -25,13 +25,13 @@ class inversionTree {
 
     // GetInvertedMatrix returns the cached inverted matrix or nil if it
     // is not found in the tree keyed on the indices of invalid rows.
-    matrix GetInvertedMatrix(std::vector<int> & invalidIndices);
+    MatrixPtr GetInvertedMatrix(std::vector<int> & invalidIndices);
 
     // InsertInvertedMatrix inserts a new inverted matrix into the tree
     // keyed by the indices of invalid rows.  The total number of shards
     // is required for creating the proper length lists of child nodes for
     // each node.
-    int InsertInvertedMatrix(std::vector<int> & invalidIndices, struct matrix &matrix, int shards);
+    int InsertInvertedMatrix(std::vector<int> & invalidIndices, MatrixPtr &matrix, int shards);
 
 private:
     inversionNode m_root;