xref: /OK3568_Linux_fs/external/rknpu2/examples/rknn_benchmark/src/cnpy/cnpy.h (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun // Copyright (C) 2011  Carl Rogers
2*4882a593Smuzhiyun // Released under MIT License
3*4882a593Smuzhiyun // license available in LICENSE file, or at http://www.opensource.org/licenses/mit-license.php
4*4882a593Smuzhiyun 
5*4882a593Smuzhiyun #ifndef LIBCNPY_H_
6*4882a593Smuzhiyun #define LIBCNPY_H_
7*4882a593Smuzhiyun 
8*4882a593Smuzhiyun #if 0
9*4882a593Smuzhiyun #include <zlib.h>
10*4882a593Smuzhiyun #endif
11*4882a593Smuzhiyun 
12*4882a593Smuzhiyun #include <stdint.h>
13*4882a593Smuzhiyun 
14*4882a593Smuzhiyun #include <cassert>
15*4882a593Smuzhiyun #include <cstdio>
16*4882a593Smuzhiyun #include <fstream>
17*4882a593Smuzhiyun #include <iostream>
18*4882a593Smuzhiyun #include <map>
19*4882a593Smuzhiyun #include <memory>
20*4882a593Smuzhiyun #include <numeric>
21*4882a593Smuzhiyun #include <sstream>
22*4882a593Smuzhiyun #include <stdexcept>
23*4882a593Smuzhiyun #include <string>
24*4882a593Smuzhiyun #include <typeinfo>
25*4882a593Smuzhiyun #include <vector>
26*4882a593Smuzhiyun 
27*4882a593Smuzhiyun namespace cnpy {
28*4882a593Smuzhiyun 
/// One array held in memory together with its .npy metadata.
///
/// The raw bytes live in `data_holder`, a shared buffer, so copying an
/// NpyArray copies the handle and both copies refer to the same bytes.
struct NpyArray
{
  /// Builds an array of the given shape and allocates a value-initialised
  /// (all zero) buffer of `product(_shape) * _word_size` bytes.
  ///
  /// @param _shape          extent of every dimension; an empty shape yields num_vals == 1
  /// @param _word_size      size in bytes of one element
  /// @param _fortran_order  stored as-is in `fortran_order`
  /// @param _typeName       stored as-is in `typeName`
  NpyArray(const std::vector<size_t>& _shape, size_t _word_size, bool _fortran_order, std::string _typeName)
    : shape(_shape)
    , word_size(_word_size)
    , fortran_order(_fortran_order)
    , num_vals(1)
    , typeName(_typeName)
  {
    for (size_t extent : shape)
      num_vals *= extent;
    data_holder = std::make_shared<std::vector<char>>(num_vals * word_size);
  }

  /// Builds an empty array: no shape, no elements and no buffer (`data_holder` is null).
  NpyArray()
    : shape()
    , word_size(0)
    , fortran_order(false)
    , num_vals(0)
  {}

  /// Returns the buffer reinterpreted as `T*`, or nullptr when no buffer is
  /// attached (default-constructed object).
  template <typename T>
  T* data()
  {
    // vector::data() is valid even for an empty vector, unlike &v[0]
    return data_holder ? reinterpret_cast<T*>(data_holder->data()) : nullptr;
  }

  /// Read-only counterpart of data(); nullptr when no buffer is attached.
  template <typename T>
  const T* data() const
  {
    return data_holder ? reinterpret_cast<const T*>(data_holder->data()) : nullptr;
  }

  /// Copies the `num_vals` elements into a new std::vector<T>.
  /// Returns an empty vector when no buffer is attached.
  template <typename T>
  std::vector<T> as_vec() const
  {
    const T* p = data<T>();
    if (p == nullptr)
      return std::vector<T>();
    return std::vector<T>(p, p + num_vals);
  }

  /// Size of the buffer in bytes; 0 when no buffer is attached.
  size_t num_bytes() const { return data_holder ? data_holder->size() : 0; }

  std::shared_ptr<std::vector<char>> data_holder;   // raw element bytes, shared between copies
  std::vector<size_t>                shape;         // extent of each dimension
  size_t                             word_size;     // bytes per element
  bool                               fortran_order; // flag taken from the constructor argument
  size_t                             num_vals;      // product of all entries of `shape`
  std::string                        typeName;      // type label taken from the constructor argument
};
78*4882a593Smuzhiyun 
// Ordered map from a std::string key to an NpyArray; this is the return type
// of the one-argument npz_load below.
// NOTE(review): keys are presumably the array names stored in the archive - confirm
// against the implementation file.
using npz_t = std::map<std::string, NpyArray>;

// Forward declarations. Only create_npy_header is defined in this header; the
// other functions have no definition here.

// Called by create_npy_header right after the opening of the 'descr' value.
char BigEndianTest(int size);
// Called by create_npy_header to append the type character of 'descr' for typeid(T).
char map_type(const std::type_info& t);
// Builds the complete .npy header (magic, version, length, dict) for element type T.
template <typename T>
std::vector<char> create_npy_header(const std::vector<size_t>& shape);
// Called by npy_save in append mode on the already opened file; fills word_size,
// shape, fortran_order and typeName through the reference parameters.
void              parse_npy_header(FILE* fp, size_t& word_size, std::vector<size_t>& shape, bool& fortran_order,
                                   std::string& typeName);
// Same output parameters as above, but reads from a memory buffer.
void     parse_npy_header(unsigned char* buffer, size_t& word_size, std::vector<size_t>& shape, bool& fortran_order,
                          std::string& typeName);
// Called by npz_save in append mode; fills the record count and the size and
// offset of the global header through the reference parameters.
void     parse_zip_footer(FILE* fp, uint16_t& nrecs, size_t& global_header_size, size_t& global_header_offset);
// Loaders - NOTE(review): presumably read a whole .npz, one named entry of a .npz,
// and a single .npy file respectively; confirm against the implementation file.
npz_t    npz_load(std::string fname);
NpyArray npz_load(std::string fname, std::string varname);
NpyArray npy_load(std::string fname);
93*4882a593Smuzhiyun 
/// Appends the object representation of `rhs` (all sizeof(T) bytes) to `lhs`
/// and returns `lhs` so that calls can be chained.
template <typename T>
std::vector<char>& operator+=(std::vector<char>& lhs, const T rhs)
{
  // Bytes are taken in the order they sit in memory, i.e. little endian on a
  // little-endian host.
  const char* const first_byte = reinterpret_cast<const char*>(&rhs);
  lhs.insert(lhs.end(), first_byte, first_byte + sizeof(T));
  return lhs;
}

// Specializations for std::string and C strings are only declared here; their
// definitions are not part of this header.
template <>
std::vector<char>& operator+=(std::vector<char>& lhs, const std::string rhs);
template <>
std::vector<char>& operator+=(std::vector<char>& lhs, const char* rhs);
109*4882a593Smuzhiyun 
110*4882a593Smuzhiyun template <typename T>
111*4882a593Smuzhiyun int npy_save(std::string fname, const T* data, const std::vector<size_t> shape, std::string mode = "w")
112*4882a593Smuzhiyun {
113*4882a593Smuzhiyun   std::ofstream ofs(fname, std::ios::out);
114*4882a593Smuzhiyun   if (!ofs.is_open()) {
115*4882a593Smuzhiyun     return -1;
116*4882a593Smuzhiyun   }
117*4882a593Smuzhiyun   ofs.close();
118*4882a593Smuzhiyun   FILE*               fp = NULL;
119*4882a593Smuzhiyun   std::vector<size_t> true_data_shape; // if appending, the shape of existing + new data
120*4882a593Smuzhiyun 
121*4882a593Smuzhiyun   if (mode == "a")
122*4882a593Smuzhiyun     fp = fopen(fname.c_str(), "r+b");
123*4882a593Smuzhiyun 
124*4882a593Smuzhiyun   if (fp) {
125*4882a593Smuzhiyun     // file exists. we need to append to it. read the header, modify the array size
126*4882a593Smuzhiyun     size_t      word_size;
127*4882a593Smuzhiyun     bool        fortran_order;
128*4882a593Smuzhiyun     std::string typeName;
129*4882a593Smuzhiyun     parse_npy_header(fp, word_size, true_data_shape, fortran_order, typeName);
130*4882a593Smuzhiyun     assert(!fortran_order);
131*4882a593Smuzhiyun 
132*4882a593Smuzhiyun     if (word_size != sizeof(T)) {
133*4882a593Smuzhiyun       std::cout << "libnpy error: " << fname << " has word size " << word_size << " but npy_save appending data sized "
134*4882a593Smuzhiyun                 << sizeof(T) << "\n";
135*4882a593Smuzhiyun       assert(word_size == sizeof(T));
136*4882a593Smuzhiyun     }
137*4882a593Smuzhiyun     if (true_data_shape.size() != shape.size()) {
138*4882a593Smuzhiyun       std::cout << "libnpy error: npy_save attempting to append misdimensioned data to " << fname << "\n";
139*4882a593Smuzhiyun       assert(true_data_shape.size() != shape.size());
140*4882a593Smuzhiyun     }
141*4882a593Smuzhiyun 
142*4882a593Smuzhiyun     for (size_t i = 1; i < shape.size(); i++) {
143*4882a593Smuzhiyun       if (shape[i] != true_data_shape[i]) {
144*4882a593Smuzhiyun         std::cout << "libnpy error: npy_save attempting to append misshaped data to " << fname << "\n";
145*4882a593Smuzhiyun         assert(shape[i] == true_data_shape[i]);
146*4882a593Smuzhiyun       }
147*4882a593Smuzhiyun     }
148*4882a593Smuzhiyun     true_data_shape[0] += shape[0];
149*4882a593Smuzhiyun   } else {
150*4882a593Smuzhiyun     fp              = fopen(fname.c_str(), "wb");
151*4882a593Smuzhiyun     true_data_shape = shape;
152*4882a593Smuzhiyun   }
153*4882a593Smuzhiyun 
154*4882a593Smuzhiyun   std::vector<char> header = create_npy_header<T>(true_data_shape);
155*4882a593Smuzhiyun   size_t            nels   = std::accumulate(shape.begin(), shape.end(), 1, std::multiplies<size_t>());
156*4882a593Smuzhiyun 
157*4882a593Smuzhiyun   fseek(fp, 0, SEEK_SET);
158*4882a593Smuzhiyun   fwrite(&header[0], sizeof(char), header.size(), fp);
159*4882a593Smuzhiyun   fseek(fp, 0, SEEK_END);
160*4882a593Smuzhiyun   fwrite(data, sizeof(T), nels, fp);
161*4882a593Smuzhiyun   fclose(fp);
162*4882a593Smuzhiyun   return 0;
163*4882a593Smuzhiyun }
164*4882a593Smuzhiyun 
165*4882a593Smuzhiyun template <typename T>
166*4882a593Smuzhiyun void npz_save(std::string zipname, std::string fname, const T* data, const std::vector<size_t>& shape,
167*4882a593Smuzhiyun               std::string mode = "w")
168*4882a593Smuzhiyun {
169*4882a593Smuzhiyun   // first, append a .npy to the fname
170*4882a593Smuzhiyun   fname += ".npy";
171*4882a593Smuzhiyun 
172*4882a593Smuzhiyun   // now, on with the show
173*4882a593Smuzhiyun   FILE*             fp                   = NULL;
174*4882a593Smuzhiyun   uint16_t          nrecs                = 0;
175*4882a593Smuzhiyun   size_t            global_header_offset = 0;
176*4882a593Smuzhiyun   std::vector<char> global_header;
177*4882a593Smuzhiyun 
178*4882a593Smuzhiyun   if (mode == "a")
179*4882a593Smuzhiyun     fp = fopen(zipname.c_str(), "r+b");
180*4882a593Smuzhiyun 
181*4882a593Smuzhiyun   if (fp) {
182*4882a593Smuzhiyun     // zip file exists. we need to add a new npy file to it.
183*4882a593Smuzhiyun     // first read the footer. this gives us the offset and size of the global header
184*4882a593Smuzhiyun     // then read and store the global header.
185*4882a593Smuzhiyun     // below, we will write the the new data at the start of the global header then append the global header and footer
186*4882a593Smuzhiyun     // below it
187*4882a593Smuzhiyun     size_t global_header_size;
188*4882a593Smuzhiyun     parse_zip_footer(fp, nrecs, global_header_size, global_header_offset);
189*4882a593Smuzhiyun     fseek(fp, global_header_offset, SEEK_SET);
190*4882a593Smuzhiyun     global_header.resize(global_header_size);
191*4882a593Smuzhiyun     size_t res = fread(&global_header[0], sizeof(char), global_header_size, fp);
192*4882a593Smuzhiyun     if (res != global_header_size) {
193*4882a593Smuzhiyun       throw std::runtime_error("npz_save: header read error while adding to existing zip");
194*4882a593Smuzhiyun     }
195*4882a593Smuzhiyun     fseek(fp, global_header_offset, SEEK_SET);
196*4882a593Smuzhiyun   } else {
197*4882a593Smuzhiyun     fp = fopen(zipname.c_str(), "wb");
198*4882a593Smuzhiyun   }
199*4882a593Smuzhiyun 
200*4882a593Smuzhiyun   std::vector<char> npy_header = create_npy_header<T>(shape);
201*4882a593Smuzhiyun 
202*4882a593Smuzhiyun   size_t nels   = std::accumulate(shape.begin(), shape.end(), 1, std::multiplies<size_t>());
203*4882a593Smuzhiyun   size_t nbytes = nels * sizeof(T) + npy_header.size();
204*4882a593Smuzhiyun 
205*4882a593Smuzhiyun #if 0
206*4882a593Smuzhiyun   // get the CRC of the data to be added
207*4882a593Smuzhiyun   uint32_t crc = crc32(0L, (uint8_t*)&npy_header[0], npy_header.size());
208*4882a593Smuzhiyun   crc          = crc32(crc, (uint8_t*)data, nels * sizeof(T));
209*4882a593Smuzhiyun #else
210*4882a593Smuzhiyun   uint32_t crc = 0;
211*4882a593Smuzhiyun #endif
212*4882a593Smuzhiyun 
213*4882a593Smuzhiyun   // build the local header
214*4882a593Smuzhiyun   std::vector<char> local_header;
215*4882a593Smuzhiyun   local_header += "PK";                   // first part of sig
216*4882a593Smuzhiyun   local_header += (uint16_t)0x0403;       // second part of sig
217*4882a593Smuzhiyun   local_header += (uint16_t)20;           // min version to extract
218*4882a593Smuzhiyun   local_header += (uint16_t)0;            // general purpose bit flag
219*4882a593Smuzhiyun   local_header += (uint16_t)0;            // compression method
220*4882a593Smuzhiyun   local_header += (uint16_t)0;            // file last mod time
221*4882a593Smuzhiyun   local_header += (uint16_t)0;            // file last mod date
222*4882a593Smuzhiyun   local_header += (uint32_t)crc;          // crc
223*4882a593Smuzhiyun   local_header += (uint32_t)nbytes;       // compressed size
224*4882a593Smuzhiyun   local_header += (uint32_t)nbytes;       // uncompressed size
225*4882a593Smuzhiyun   local_header += (uint16_t)fname.size(); // fname length
226*4882a593Smuzhiyun   local_header += (uint16_t)0;            // extra field length
227*4882a593Smuzhiyun   local_header += fname;
228*4882a593Smuzhiyun 
229*4882a593Smuzhiyun   // build global header
230*4882a593Smuzhiyun   global_header += "PK";             // first part of sig
231*4882a593Smuzhiyun   global_header += (uint16_t)0x0201; // second part of sig
232*4882a593Smuzhiyun   global_header += (uint16_t)20;     // version made by
233*4882a593Smuzhiyun   global_header.insert(global_header.end(), local_header.begin() + 4, local_header.begin() + 30);
234*4882a593Smuzhiyun   global_header += (uint16_t)0; // file comment length
235*4882a593Smuzhiyun   global_header += (uint16_t)0; // disk number where file starts
236*4882a593Smuzhiyun   global_header += (uint16_t)0; // internal file attributes
237*4882a593Smuzhiyun   global_header += (uint32_t)0; // external file attributes
238*4882a593Smuzhiyun   global_header += (uint32_t)
239*4882a593Smuzhiyun     global_header_offset; // relative offset of local file header, since it begins where the global header used to begin
240*4882a593Smuzhiyun   global_header += fname;
241*4882a593Smuzhiyun 
242*4882a593Smuzhiyun   // build footer
243*4882a593Smuzhiyun   std::vector<char> footer;
244*4882a593Smuzhiyun   footer += "PK";                           // first part of sig
245*4882a593Smuzhiyun   footer += (uint16_t)0x0605;               // second part of sig
246*4882a593Smuzhiyun   footer += (uint16_t)0;                    // number of this disk
247*4882a593Smuzhiyun   footer += (uint16_t)0;                    // disk where footer starts
248*4882a593Smuzhiyun   footer += (uint16_t)(nrecs + 1);          // number of records on this disk
249*4882a593Smuzhiyun   footer += (uint16_t)(nrecs + 1);          // total number of records
250*4882a593Smuzhiyun   footer += (uint32_t)global_header.size(); // nbytes of global headers
251*4882a593Smuzhiyun   footer +=
252*4882a593Smuzhiyun     (uint32_t)(global_header_offset + nbytes + local_header.size()); // offset of start of global headers, since global
253*4882a593Smuzhiyun                                                                      // header now starts after newly written array
254*4882a593Smuzhiyun   footer += (uint16_t)0;                                             // zip file comment length
255*4882a593Smuzhiyun 
256*4882a593Smuzhiyun   // write everything
257*4882a593Smuzhiyun   fwrite(&local_header[0], sizeof(char), local_header.size(), fp);
258*4882a593Smuzhiyun   fwrite(&npy_header[0], sizeof(char), npy_header.size(), fp);
259*4882a593Smuzhiyun   fwrite(data, sizeof(T), nels, fp);
260*4882a593Smuzhiyun   fwrite(&global_header[0], sizeof(char), global_header.size(), fp);
261*4882a593Smuzhiyun   fwrite(&footer[0], sizeof(char), footer.size(), fp);
262*4882a593Smuzhiyun   fclose(fp);
263*4882a593Smuzhiyun }
264*4882a593Smuzhiyun 
/// Convenience overload: saves a std::vector as a one-dimensional array of
/// `data.size()` elements by forwarding to the pointer-based npy_save.
/// The int result of that call is discarded.
///
/// @param fname  path of the file to write
/// @param data   elements to store
/// @param mode   forwarded unchanged to the pointer-based overload
template <typename T>
void npy_save(std::string fname, const std::vector<T> data, std::string mode = "w")
{
  const std::vector<size_t> shape(1, data.size());
  // data() is well defined for an empty vector, whereas &data[0] is not
  npy_save(fname, data.data(), shape, mode);
}
272*4882a593Smuzhiyun 
/// Convenience overload: stores a std::vector as a one-dimensional array of
/// `data.size()` elements by forwarding to the pointer-based npz_save.
///
/// @param zipname  path of the archive
/// @param fname    entry name, forwarded unchanged
/// @param data     elements to store
/// @param mode     forwarded unchanged to the pointer-based overload
template <typename T>
void npz_save(std::string zipname, std::string fname, const std::vector<T> data, std::string mode = "w")
{
  const std::vector<size_t> shape(1, data.size());
  // data() is well defined for an empty vector, whereas &data[0] is not
  npz_save(zipname, fname, data.data(), shape, mode);
}
280*4882a593Smuzhiyun 
281*4882a593Smuzhiyun template <typename T>
create_npy_header(const std::vector<size_t> & shape)282*4882a593Smuzhiyun std::vector<char> create_npy_header(const std::vector<size_t>& shape)
283*4882a593Smuzhiyun {
284*4882a593Smuzhiyun   const char* tpye_name = typeid(T).name();
285*4882a593Smuzhiyun   std::vector<char> dict;
286*4882a593Smuzhiyun   dict += "{'descr': '";
287*4882a593Smuzhiyun   dict += BigEndianTest(sizeof(T));
288*4882a593Smuzhiyun   if (std::string(tpye_name) == "N4rknn7float16E") {
289*4882a593Smuzhiyun     dict += "f";
290*4882a593Smuzhiyun   } else {
291*4882a593Smuzhiyun     dict += map_type(typeid(T));
292*4882a593Smuzhiyun   }
293*4882a593Smuzhiyun   dict += std::to_string(sizeof(T));
294*4882a593Smuzhiyun   dict += "', 'fortran_order': False, 'shape': (";
295*4882a593Smuzhiyun   dict += std::to_string(shape[0]);
296*4882a593Smuzhiyun   for (size_t i = 1; i < shape.size(); i++) {
297*4882a593Smuzhiyun     dict += ", ";
298*4882a593Smuzhiyun     dict += std::to_string(shape[i]);
299*4882a593Smuzhiyun   }
300*4882a593Smuzhiyun   if (shape.size() == 1)
301*4882a593Smuzhiyun     dict += ",";
302*4882a593Smuzhiyun   dict += "), }";
303*4882a593Smuzhiyun   // pad with spaces so that preamble+dict is modulo 16 bytes. preamble is 10 bytes. dict needs to end with \n
304*4882a593Smuzhiyun   int remainder = 16 - (10 + dict.size()) % 16;
305*4882a593Smuzhiyun   dict.insert(dict.end(), remainder, ' ');
306*4882a593Smuzhiyun   dict.back() = '\n';
307*4882a593Smuzhiyun 
308*4882a593Smuzhiyun   std::vector<char> header;
309*4882a593Smuzhiyun   header += (char)0x93;
310*4882a593Smuzhiyun   header += "NUMPY";
311*4882a593Smuzhiyun   header += (char)0x01; // major version of numpy format
312*4882a593Smuzhiyun   header += (char)0x00; // minor version of numpy format
313*4882a593Smuzhiyun   header += (uint16_t)dict.size();
314*4882a593Smuzhiyun   header.insert(header.end(), dict.begin(), dict.end());
315*4882a593Smuzhiyun 
316*4882a593Smuzhiyun   return header;
317*4882a593Smuzhiyun }
318*4882a593Smuzhiyun 
319*4882a593Smuzhiyun } // namespace cnpy
320*4882a593Smuzhiyun 
321*4882a593Smuzhiyun #endif
322