ArmNN
 25.02
All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Friends Macros Pages
armnnNumpy Namespace Reference

Classes

struct  HeaderInfo
 from the numpy file to be parsed. More...
 
struct  Header
 from the numpy file to be parsed. More...
 

Functions

void CreateHeaderInfo (std::ifstream &ifStream, HeaderInfo &headerInfo)
 
std::string getSubstring (std::string fullString, std::string substringStart, std::string substringEnd, bool removeStartChar=0, bool includeEndChar=0)
 Primarily used to isolate values from header dictionary. More...
 
void parseShape (Header &header, std::string &shapeString)
 
void CreateHeader (std::ifstream &ifStream, HeaderInfo &headerInfo, Header &header)
 
template<typename T >
void ReadData (std::ifstream &ifStream, T *tensor, const unsigned int &numElements)
 
armnn::DataType getArmNNDataType (std::string &descr)
 
std::string getNumpyDescr (armnn::DataType dType)
 
template<typename T >
bool compareCTypes (std::string &descr)
 
unsigned int getNumElements (Header &header)
 
template<typename T >
void WriteToNumpyFile (const std::string &outputTensorFileName, const T *const array, const unsigned int numElements, armnn::DataType dataType, const armnn::TensorShape &shape)
 

Function Documentation

◆ compareCTypes()

bool armnnNumpy::compareCTypes ( std::string &  descr)
inline

Definition at line 279 of file Numpy.hpp.

280  {
281  if(descr.find("f4") != std::string::npos || descr.find("f8") != std::string::npos)
282  {
283  return std::is_same<T, float>::value;
284  }
285  else if (descr.find("i8") != std::string::npos)
286  {
287  return std::is_same<T, int64_t>::value;
288  }
289  else if (descr.find("i4") != std::string::npos)
290  {
291  return std::is_same<T, int32_t>::value;
292  }
293  else if (descr.find("i2") != std::string::npos)
294  {
295  return std::is_same<T, int16_t>::value;
296  }
297  else if (descr.find("i1") != std::string::npos)
298  {
299  return std::is_same<T, int8_t>::value;
300  }
301  else if (descr.find("u1") != std::string::npos)
302  {
303  return std::is_same<T, uint8_t>::value;
304  }
305  else
306  {
307  throw armnn::Exception(fmt::format("Numpy data type:{} not supported. {}",
308  descr, CHECK_LOCATION().AsString()));
309  }
310  }
#define CHECK_LOCATION()
Definition: Exceptions.hpp:203
Base class for all ArmNN exceptions so that users can filter to just those.
Definition: Exceptions.hpp:47

References CHECK_LOCATION.

◆ CreateHeader()

void armnnNumpy::CreateHeader ( std::ifstream &  ifStream,
HeaderInfo headerInfo,
Header header 
)
inline

Definition at line 157 of file Numpy.hpp.

158  {
159  char stringBuffer[headerInfo.m_HeaderLen];
160  ifStream.read(stringBuffer, static_cast<std::streamsize>(headerInfo.m_HeaderLen));
161 
162  header.m_HeaderString = std::string(stringBuffer, headerInfo.m_HeaderLen);
163  // Remove new line character at the end of the string
164  if(header.m_HeaderString.back() == '\n')
165  {
166  header.m_HeaderString.pop_back();
167  }
168 
169  // Remove whitespace from the string.
170  // std::remove shuffles the string by place all whitespace at the end and
171  // returning the start location of the shuffled whitespace.
172  // std::string.erase then deletes the whitespace by deleting characters
173  // between the iterator returned from std::remove and the end of the std::string
174  std::string::iterator whitespaceSubstringStart = std::remove(header.m_HeaderString.begin(),
175  header.m_HeaderString.end(), ' ');
176  header.m_HeaderString.erase(whitespaceSubstringStart, header.m_HeaderString.end());
177 
178  // The order of the dictionary should be alphabetical,
179  // however this is not guarenteed so we have to search for the string.
180  // Because of this we do some weird parsing using std::string.find and some magic patterns
181  //
182  // For the description value, we include the end character from the first substring
183  // to help us find the value in the second substring. This should return with a "," at the end.
184  // Since we previously left the "," at the end of the substring,
185  // we can use it to find the end of the description value and then remove it after.
186  std::string descrString = getSubstring(header.m_HeaderString, "'descr", ",", 0, 1);
187  header.m_DescrString = getSubstring(descrString, ":", ",", 1);
188 
189  // Fortran order is a python boolean literal, we simply look for a comma to delimit this pair.
190  // Since this is a boolean, both true and false end in an "e" without appearing in between.
191  // It is not great, but it is the easiest way to find the end.
192  // We have to ensure we include this e in the substring.
193  // Since this is a boolean we can check if the string contains
194  // either true or false and set the variable as required
195  std::string fortranOrderString = getSubstring(header.m_HeaderString, "'fortran_order", ",");
196  fortranOrderString = getSubstring(fortranOrderString, ":", "e", 1, 1);
197  header.m_FortranOrder = fortranOrderString.find("True") != std::string::npos ? true : false;
198 
199  // The shape is a python tuple so we search for the closing bracket of the tuple.
200  // We include the end character to help us isolate the value substring.
201  // We can extract the inside of the tuple by searching for opening and closing brackets.
202  // We can then remove the brackets isolating the inside of the tuple.
203  // We then need to parse the string into a vector of unsigned integers
204  std::string shapeString = getSubstring(header.m_HeaderString, "'shape", ")", 0, 1);
205  shapeString = getSubstring(shapeString, "(", ")", 1, 0);
206  parseShape(header, shapeString);
207  }
void parseShape(Header &header, std::string &shapeString)
Definition: Numpy.hpp:147
std::string getSubstring(std::string fullString, std::string substringStart, std::string substringEnd, bool removeStartChar=0, bool includeEndChar=0)
Primarily used to isolate values from header dictionary.
Definition: Numpy.hpp:125

References getSubstring(), Header::m_DescrString, Header::m_FortranOrder, HeaderInfo::m_HeaderLen, Header::m_HeaderString, and parseShape().

◆ CreateHeaderInfo()

void armnnNumpy::CreateHeaderInfo ( std::ifstream &  ifStream,
HeaderInfo headerInfo 
)
inline

Definition at line 51 of file Numpy.hpp.

52  {
53  // A Numpy header consists of:
54  // a magic string "x93NUMPY"
55  // 1 byte for the major version
56  // 1 byte for the minor version
57  // 2 or 4 bytes for the header length
58  // More info: https://numpy.org/devdocs/reference/generated/numpy.lib.format.html
59  char buffer[headerInfo.m_MagicStringLength + 2lu];
60  ifStream.read(buffer, headerInfo.m_MagicStringLength + 2);
61 
62  if (!ifStream)
63  {
64  throw armnn::Exception(
65  fmt::format("Failed to create numpy header info at {}",
66  CHECK_LOCATION().AsString()));
67  }
68  // Verify that the numpy is in the valid format by checking for the magic string
69  int compare_result = ::memcmp(buffer, headerInfo.m_MagicString, headerInfo.m_MagicStringLength);
70  if (compare_result != 0) {
71  throw armnn::Exception(fmt::format("Numpy does not contain magic string. Can not parse invalid numpy {}",
72  CHECK_LOCATION().AsString()));
73  }
74 
75  headerInfo.m_MajorVersion = buffer[headerInfo.m_MagicStringLength];
76  headerInfo.m_MinorVersion = buffer[headerInfo.m_MagicStringLength + 1];
77  if(headerInfo.m_MajorVersion == 1 && headerInfo.m_MinorVersion == 0)
78  {
79  ifStream.read(headerInfo.m_HeaderLenBytes, 2);
80  // Header len is written in little endian, so we do a quick test
81  // to check the machines endianness
82  int i = 1;
83  if (*(reinterpret_cast<char *>(&i)) == 1)
84  {
85  headerInfo.m_HeaderLen = static_cast<unsigned>(headerInfo.m_HeaderLenBytes[0]) |
86  (static_cast<unsigned>(headerInfo.m_HeaderLenBytes[1] << 8));
87  }
88  else
89  {
90  headerInfo.m_HeaderLen = static_cast<unsigned>(headerInfo.m_HeaderLenBytes[1]) |
91  (static_cast<unsigned>(headerInfo.m_HeaderLenBytes[0] << 8));
92  }
93  }
94  else if (headerInfo.m_MajorVersion == 2 && headerInfo.m_MinorVersion == 0)
95  {
96  ifStream.read(headerInfo.m_HeaderLenBytes, 4);
97  // Header len is written in little endian, so we do a quick test
98  // to check the machines endianness
99  int i = 1;
100  if (*(reinterpret_cast<char *>(&i)) == 1)
101  {
102  headerInfo.m_HeaderLen = static_cast<unsigned>(headerInfo.m_HeaderLenBytes[0] << 0) |
103  static_cast<unsigned>(headerInfo.m_HeaderLenBytes[1] << 8) |
104  static_cast<unsigned>(headerInfo.m_HeaderLenBytes[2] << 16) |
105  static_cast<unsigned>(headerInfo.m_HeaderLenBytes[3] << 24);
106  }
107  else
108  {
109  headerInfo.m_HeaderLen = static_cast<unsigned>(headerInfo.m_HeaderLenBytes[3] << 0) |
110  static_cast<unsigned>(headerInfo.m_HeaderLenBytes[2] << 8) |
111  static_cast<unsigned>(headerInfo.m_HeaderLenBytes[1] << 16) |
112  static_cast<unsigned>(headerInfo.m_HeaderLenBytes[0] << 24);
113  }
114  }
115  else
116  {
117  throw armnn::ParseException(fmt::format("Unable to parser Numpy version {}.{} {}",
118  headerInfo.m_MajorVersion,
119  headerInfo.m_MinorVersion,
120  CHECK_LOCATION().AsString()));
121  }
122  }

References CHECK_LOCATION, HeaderInfo::m_HeaderLen, HeaderInfo::m_HeaderLenBytes, HeaderInfo::m_MagicString, HeaderInfo::m_MagicStringLength, HeaderInfo::m_MajorVersion, and HeaderInfo::m_MinorVersion.

◆ getArmNNDataType()

armnn::DataType armnnNumpy::getArmNNDataType ( std::string &  descr)
inline

Definition at line 216 of file Numpy.hpp.

217  {
218  if(descr.find("f4") != std::string::npos || descr.find("f8") != std::string::npos)
219  {
221  }
222  else if (descr.find("f2") != std::string::npos)
223  {
225  }
226  else if (descr.find("i8") != std::string::npos)
227  {
229  }
230  else if (descr.find("i4") != std::string::npos)
231  {
233  }
234  else if (descr.find("i2") != std::string::npos)
235  {
237  }
238  else if (descr.find("i1") != std::string::npos)
239  {
241  }
242  else if (descr.find("u1") != std::string::npos)
243  {
245  }
246  else
247  {
248  throw armnn::Exception(fmt::format("Numpy data type:{} not supported. {}",
249  descr, CHECK_LOCATION().AsString()));
250  }
251  }

References CHECK_LOCATION, armnn::Float16, armnn::Float32, armnn::QAsymmU8, armnn::QSymmS16, armnn::QSymmS8, armnn::Signed32, and armnn::Signed64.

◆ getNumElements()

unsigned int armnnNumpy::getNumElements ( Header header)
inline

Definition at line 312 of file Numpy.hpp.

313  {
314  unsigned int numEls = 1;
315  for (auto dim: header.m_Shape)
316  {
317  numEls *= dim;
318  }
319 
320  return numEls;
321  }

References Header::m_Shape.

◆ getNumpyDescr()

std::string armnnNumpy::getNumpyDescr ( armnn::DataType  dType)
inline

Definition at line 253 of file Numpy.hpp.

254  {
255  switch(dType)
256  {
258  return "f" + std::to_string(sizeof(float)); // size of float can be 4 or 8
260  return "f2";
262  return "i8";
264  return "i4";
266  return "i2";
269  return "i1";
271  return "u1";
272  default:
273  throw armnn::Exception(fmt::format("ArmNN to Numpy data type:{} not supported. {}",
274  dType, CHECK_LOCATION().AsString()));
275  }
276  }

References CHECK_LOCATION, armnn::Float16, armnn::Float32, armnn::QAsymmS8, armnn::QAsymmU8, armnn::QSymmS16, armnn::QSymmS8, armnn::Signed32, and armnn::Signed64.

Referenced by WriteToNumpyFile().

◆ getSubstring()

std::string armnnNumpy::getSubstring ( std::string  fullString,
std::string  substringStart,
std::string  substringEnd,
bool  removeStartChar = 0,
bool  includeEndChar = 0 
)
inline

Primarily used to isolate values from header dictionary.

Definition at line 125 of file Numpy.hpp.

130  {
131  size_t startPos = fullString.find(substringStart);
132  size_t endPos = fullString.find(substringEnd, startPos);
133  if (startPos == std::string::npos || endPos == std::string::npos)
134  {
135  throw armnn::ParseException(fmt::format("Unable to find {} in numpy file.",
136  CHECK_LOCATION().AsString()));
137  }
138 
139  // std::string.substr takes the starting position and the length of the substring.
140  // To calculate the length we subtract the start position from the end position.
141  // We also add a boolean on whether or not we want to include the character used to find endPos
142  startPos+= removeStartChar;
143  endPos += includeEndChar;
144  return fullString.substr(startPos, endPos - startPos);
145  }

References CHECK_LOCATION.

Referenced by CreateHeader().

◆ parseShape()

void armnnNumpy::parseShape ( Header header,
std::string &  shapeString 
)
inline

Definition at line 147 of file Numpy.hpp.

148  {
149  std::istringstream shapeStringStream(shapeString);
150  std::string token;
151  while(getline(shapeStringStream, token, ','))
152  {
153  header.m_Shape.push_back(static_cast<uint32_t >(std::stoi(token)));
154  }
155  }

References Header::m_Shape.

Referenced by CreateHeader().

◆ ReadData()

void armnnNumpy::ReadData ( std::ifstream &  ifStream,
T *  tensor,
const unsigned int &  numElements 
)
inline

Definition at line 210 of file Numpy.hpp.

211  {
212  ifStream.read(reinterpret_cast<char *>(tensor), sizeof(T) * numElements);
213  }

◆ WriteToNumpyFile()

void armnnNumpy::WriteToNumpyFile ( const std::string &  outputTensorFileName,
const T *const  array,
const unsigned int  numElements,
armnn::DataType  dataType,
const armnn::TensorShape shape 
)
inline

Definition at line 326 of file Numpy.hpp.

331  {
332  std::ofstream out(outputTensorFileName, std::ofstream::binary);
333 
334  // write header
335  {
336  // Setup string of tensor shape in format (x0, x1, x2, ..)
337  std::string shapeStr = "(";
338  for (uint32_t i = 0; i < shape.GetNumDimensions()-1; i++)
339  {
340  shapeStr = shapeStr + std::to_string(shape[i]) + ", ";
341  }
342  shapeStr = shapeStr + std::to_string(shape[shape.GetNumDimensions()-1]) + ")";
343 
344  int i = 1;
345  std::string endianChar = (*(reinterpret_cast<char *>(&i))) ? "<" : ">";
346  std::string dataTypeStr = getNumpyDescr(dataType);
347  std::string fortranOrder = "False";
348  std::string headerStr = "{'descr': '" + endianChar + dataTypeStr +
349  "', 'fortran_order': " + fortranOrder +
350  ", 'shape': " + shapeStr + ", }";
351 
352  armnnNumpy::HeaderInfo headerInfo;
353 
354  // Header is composed of:
355  // - 6 byte magic string
356  // - 2 byte major and minor version
357  // - 2 byte (v1.0) / 4 byte (v2.0) little-endian unsigned int
358  // - headerStr.length() bytes
359  // - 1 byte for newline termination (\n)
360  size_t length = headerInfo.m_MagicStringLength + 2 + 2 + headerStr.length() + 1;
361  uint8_t major_version = 1;
362 
363  // for numpy major version 2, add extra 2 bytes for little-endian int (total 4 bytes)
364  if (length >= 255 * 255)
365  {
366  length += 2;
367  major_version = 2;
368  }
369 
370  // Pad with spaces so header length is modulo 16 bytes.
371  size_t padding_length = 16 - length % 16;
372  std::string padding(padding_length, ' ');
373 
374  // write magic string
375  out.write(headerInfo.m_MagicString, headerInfo.m_MagicStringLength);
376  out.put(major_version);
377  out.put(0); // minor version
378 
379  // write header length
380  if (major_version == 1)
381  {
382  auto header_len = static_cast<uint16_t>(headerStr.length() + padding.length() + 1);
383 
384  std::array<uint8_t, 2> header_len_16{static_cast<uint8_t>((header_len >> 0) & 0xff),
385  static_cast<uint8_t>((header_len >> 8) & 0xff)};
386  out.write(reinterpret_cast<char *>(header_len_16.data()), 2);
387  }
388  else
389  {
390  auto header_len = static_cast<uint32_t>(headerStr.length() + padding.length() + 1);
391 
392  std::array<uint8_t, 4> header_len_32{
393  static_cast<uint8_t>((header_len >> 0) & 0xff), static_cast<uint8_t>((header_len >> 8) & 0xff),
394  static_cast<uint8_t>((header_len >> 16) & 0xff), static_cast<uint8_t>((header_len >> 24) & 0xff)};
395  out.write(reinterpret_cast<char *>(header_len_32.data()), 4);
396  }
397 
398  out << headerStr << padding << '\n';
399  }
400 
401  // write tensor data to file
402  out.write(reinterpret_cast<const char *>(array), sizeof(T) * numElements);
403  }
unsigned int GetNumDimensions() const
Function that returns the tensor rank.
Definition: Tensor.cpp:174
std::string getNumpyDescr(armnn::DataType dType)
Definition: Numpy.hpp:253
from the numpy file to be parsed.
Definition: Numpy.hpp:29
const char m_MagicString[7]
Definition: Numpy.hpp:33
const uint8_t m_MagicStringLength
Definition: Numpy.hpp:32

References TensorShape::GetNumDimensions(), getNumpyDescr(), HeaderInfo::m_MagicString, and HeaderInfo::m_MagicStringLength.