130fdc8d8SChris Lattner //===-- StringExtractor.cpp -------------------------------------*- C++ -*-===// 230fdc8d8SChris Lattner // 330fdc8d8SChris Lattner // The LLVM Compiler Infrastructure 430fdc8d8SChris Lattner // 530fdc8d8SChris Lattner // This file is distributed under the University of Illinois Open Source 630fdc8d8SChris Lattner // License. See LICENSE.TXT for details. 730fdc8d8SChris Lattner // 830fdc8d8SChris Lattner //===----------------------------------------------------------------------===// 930fdc8d8SChris Lattner 10c982c768SGreg Clayton #include "Utility/StringExtractor.h" 1130fdc8d8SChris Lattner 1230fdc8d8SChris Lattner // C Includes 13*78709173SStephen Wilson #include <stdlib.h> 14*78709173SStephen Wilson 1530fdc8d8SChris Lattner // C++ Includes 1630fdc8d8SChris Lattner // Other libraries and framework includes 1730fdc8d8SChris Lattner // Project includes 1830fdc8d8SChris Lattner 1930fdc8d8SChris Lattner static inline int 2030fdc8d8SChris Lattner xdigit_to_sint (char ch) 2130fdc8d8SChris Lattner { 2230fdc8d8SChris Lattner if (ch >= 'a' && ch <= 'f') 2330fdc8d8SChris Lattner return 10 + ch - 'a'; 241e89cd80SBenjamin Kramer if (ch >= 'A' && ch <= 'F') 251e89cd80SBenjamin Kramer return 10 + ch - 'A'; 2630fdc8d8SChris Lattner return ch - '0'; 2730fdc8d8SChris Lattner } 2830fdc8d8SChris Lattner 2930fdc8d8SChris Lattner static inline unsigned int 3030fdc8d8SChris Lattner xdigit_to_uint (uint8_t ch) 3130fdc8d8SChris Lattner { 3230fdc8d8SChris Lattner if (ch >= 'a' && ch <= 'f') 3330fdc8d8SChris Lattner return 10u + ch - 'a'; 341e89cd80SBenjamin Kramer if (ch >= 'A' && ch <= 'F') 351e89cd80SBenjamin Kramer return 10u + ch - 'A'; 3630fdc8d8SChris Lattner return ch - '0'; 3730fdc8d8SChris Lattner } 3830fdc8d8SChris Lattner 3930fdc8d8SChris Lattner //---------------------------------------------------------------------- 4030fdc8d8SChris Lattner // StringExtractor constructor 4130fdc8d8SChris Lattner //---------------------------------------------------------------------- 4230fdc8d8SChris Lattner StringExtractor::StringExtractor() : 4330fdc8d8SChris Lattner m_packet(), 4430fdc8d8SChris Lattner m_index (0) 4530fdc8d8SChris Lattner { 4630fdc8d8SChris Lattner } 4730fdc8d8SChris Lattner 4830fdc8d8SChris Lattner 4930fdc8d8SChris Lattner StringExtractor::StringExtractor(const char *packet_cstr) : 5030fdc8d8SChris Lattner m_packet(), 5130fdc8d8SChris Lattner m_index (0) 5230fdc8d8SChris Lattner { 5330fdc8d8SChris Lattner if (packet_cstr) 5430fdc8d8SChris Lattner m_packet.assign (packet_cstr); 5530fdc8d8SChris Lattner } 5630fdc8d8SChris Lattner 5730fdc8d8SChris Lattner 5830fdc8d8SChris Lattner //---------------------------------------------------------------------- 5930fdc8d8SChris Lattner // StringExtractor copy constructor 6030fdc8d8SChris Lattner //---------------------------------------------------------------------- 6130fdc8d8SChris Lattner StringExtractor::StringExtractor(const StringExtractor& rhs) : 6230fdc8d8SChris Lattner m_packet (rhs.m_packet), 6330fdc8d8SChris Lattner m_index (rhs.m_index) 6430fdc8d8SChris Lattner { 6530fdc8d8SChris Lattner 6630fdc8d8SChris Lattner } 6730fdc8d8SChris Lattner 6830fdc8d8SChris Lattner //---------------------------------------------------------------------- 6930fdc8d8SChris Lattner // StringExtractor assignment operator 7030fdc8d8SChris Lattner //---------------------------------------------------------------------- 7130fdc8d8SChris Lattner const StringExtractor& 7230fdc8d8SChris Lattner StringExtractor::operator=(const StringExtractor& rhs) 7330fdc8d8SChris Lattner { 7430fdc8d8SChris Lattner if (this != &rhs) 7530fdc8d8SChris Lattner { 7630fdc8d8SChris Lattner m_packet = rhs.m_packet; 7730fdc8d8SChris Lattner m_index = rhs.m_index; 7830fdc8d8SChris Lattner 7930fdc8d8SChris Lattner } 8030fdc8d8SChris Lattner return *this; 8130fdc8d8SChris Lattner } 8230fdc8d8SChris Lattner 8330fdc8d8SChris Lattner //---------------------------------------------------------------------- 8430fdc8d8SChris Lattner // Destructor 8530fdc8d8SChris Lattner //---------------------------------------------------------------------- 8630fdc8d8SChris Lattner StringExtractor::~StringExtractor() 8730fdc8d8SChris Lattner { 8830fdc8d8SChris Lattner } 8930fdc8d8SChris Lattner 9030fdc8d8SChris Lattner 9130fdc8d8SChris Lattner char 9230fdc8d8SChris Lattner StringExtractor::GetChar (char fail_value) 9330fdc8d8SChris Lattner { 9430fdc8d8SChris Lattner if (m_index < m_packet.size()) 9530fdc8d8SChris Lattner { 9630fdc8d8SChris Lattner char ch = m_packet[m_index]; 9730fdc8d8SChris Lattner ++m_index; 9830fdc8d8SChris Lattner return ch; 9930fdc8d8SChris Lattner } 10030fdc8d8SChris Lattner m_index = UINT32_MAX; 10130fdc8d8SChris Lattner return fail_value; 10230fdc8d8SChris Lattner } 10330fdc8d8SChris Lattner 10430fdc8d8SChris Lattner uint32_t 10530fdc8d8SChris Lattner StringExtractor::GetNumHexASCIICharsAtFilePos (uint32_t max) const 10630fdc8d8SChris Lattner { 10730fdc8d8SChris Lattner uint32_t idx = m_index; 10830fdc8d8SChris Lattner const size_t size = m_packet.size(); 10930fdc8d8SChris Lattner while (idx < size && idx - m_index < max && isxdigit(m_packet[idx])) 11030fdc8d8SChris Lattner ++idx; 11130fdc8d8SChris Lattner return idx - m_index; 11230fdc8d8SChris Lattner } 11330fdc8d8SChris Lattner //---------------------------------------------------------------------- 11430fdc8d8SChris Lattner // Extract a signed character from two hex ASCII chars in the packet 11530fdc8d8SChris Lattner // string 11630fdc8d8SChris Lattner //---------------------------------------------------------------------- 11730fdc8d8SChris Lattner int8_t 11830fdc8d8SChris Lattner StringExtractor::GetHexS8 (int8_t fail_value) 11930fdc8d8SChris Lattner { 12030fdc8d8SChris Lattner if (GetNumHexASCIICharsAtFilePos(2)) 12130fdc8d8SChris Lattner { 12230fdc8d8SChris Lattner char hi_nibble_char = m_packet[m_index]; 12330fdc8d8SChris Lattner char lo_nibble_char = m_packet[m_index+1]; 12430fdc8d8SChris Lattner 12530fdc8d8SChris Lattner if (isxdigit(hi_nibble_char) && isxdigit(lo_nibble_char)) 12630fdc8d8SChris Lattner { 12730fdc8d8SChris Lattner char hi_nibble = xdigit_to_sint (hi_nibble_char); 12830fdc8d8SChris Lattner char lo_nibble = xdigit_to_sint (lo_nibble_char); 12930fdc8d8SChris Lattner m_index += 2; 13030fdc8d8SChris Lattner return (hi_nibble << 4) + lo_nibble; 13130fdc8d8SChris Lattner } 13230fdc8d8SChris Lattner } 13330fdc8d8SChris Lattner m_index = UINT32_MAX; 13430fdc8d8SChris Lattner return fail_value; 13530fdc8d8SChris Lattner } 13630fdc8d8SChris Lattner 13730fdc8d8SChris Lattner //---------------------------------------------------------------------- 13830fdc8d8SChris Lattner // Extract an unsigned character from two hex ASCII chars in the packet 13930fdc8d8SChris Lattner // string 14030fdc8d8SChris Lattner //---------------------------------------------------------------------- 14130fdc8d8SChris Lattner uint8_t 14230fdc8d8SChris Lattner StringExtractor::GetHexU8 (uint8_t fail_value) 14330fdc8d8SChris Lattner { 14430fdc8d8SChris Lattner if (GetNumHexASCIICharsAtFilePos(2)) 14530fdc8d8SChris Lattner { 14630fdc8d8SChris Lattner uint8_t hi_nibble_char = m_packet[m_index]; 14730fdc8d8SChris Lattner uint8_t lo_nibble_char = m_packet[m_index+1]; 14830fdc8d8SChris Lattner 14930fdc8d8SChris Lattner if (isxdigit(hi_nibble_char) && isxdigit(lo_nibble_char)) 15030fdc8d8SChris Lattner { 15171337622SGreg Clayton uint8_t hi_nibble = xdigit_to_uint (hi_nibble_char); 15271337622SGreg Clayton uint8_t lo_nibble = xdigit_to_uint (lo_nibble_char); 15330fdc8d8SChris Lattner m_index += 2; 15430fdc8d8SChris Lattner return (hi_nibble << 4) + lo_nibble; 15530fdc8d8SChris Lattner } 15630fdc8d8SChris Lattner } 15730fdc8d8SChris Lattner m_index = UINT32_MAX; 15830fdc8d8SChris Lattner return fail_value; 15930fdc8d8SChris Lattner } 16030fdc8d8SChris Lattner 16130fdc8d8SChris Lattner uint32_t 16232e0a750SGreg Clayton StringExtractor::GetU32 (uint32_t fail_value, int base) 16332e0a750SGreg Clayton { 16432e0a750SGreg Clayton if (m_index < m_packet.size()) 16532e0a750SGreg Clayton { 16632e0a750SGreg Clayton char *end = NULL; 16732e0a750SGreg Clayton const char *start = m_packet.c_str(); 16832e0a750SGreg Clayton const char *uint_cstr = start + m_index; 16932e0a750SGreg Clayton uint32_t result = ::strtoul (uint_cstr, &end, base); 17032e0a750SGreg Clayton 17132e0a750SGreg Clayton if (end && end != uint_cstr) 17232e0a750SGreg Clayton { 17332e0a750SGreg Clayton m_index = end - start; 17432e0a750SGreg Clayton return result; 17532e0a750SGreg Clayton } 17632e0a750SGreg Clayton } 17732e0a750SGreg Clayton return fail_value; 17832e0a750SGreg Clayton } 17932e0a750SGreg Clayton 18032e0a750SGreg Clayton 18132e0a750SGreg Clayton uint32_t 18230fdc8d8SChris Lattner StringExtractor::GetHexMaxU32 (bool little_endian, uint32_t fail_value) 18330fdc8d8SChris Lattner { 18430fdc8d8SChris Lattner uint32_t result = 0; 18530fdc8d8SChris Lattner uint32_t nibble_count = 0; 18630fdc8d8SChris Lattner 18730fdc8d8SChris Lattner if (little_endian) 18830fdc8d8SChris Lattner { 18930fdc8d8SChris Lattner uint32_t shift_amount = 0; 19030fdc8d8SChris Lattner while (m_index < m_packet.size() && ::isxdigit (m_packet[m_index])) 19130fdc8d8SChris Lattner { 19230fdc8d8SChris Lattner // Make sure we don't exceed the size of a uint32_t... 19330fdc8d8SChris Lattner if (nibble_count >= (sizeof(uint32_t) * 2)) 19430fdc8d8SChris Lattner { 19530fdc8d8SChris Lattner m_index = UINT32_MAX; 19630fdc8d8SChris Lattner return fail_value; 19730fdc8d8SChris Lattner } 19830fdc8d8SChris Lattner 19930fdc8d8SChris Lattner uint8_t nibble_lo; 20030fdc8d8SChris Lattner uint8_t nibble_hi = xdigit_to_sint (m_packet[m_index]); 20130fdc8d8SChris Lattner ++m_index; 20230fdc8d8SChris Lattner if (m_index < m_packet.size() && ::isxdigit (m_packet[m_index])) 20330fdc8d8SChris Lattner { 20430fdc8d8SChris Lattner nibble_lo = xdigit_to_sint (m_packet[m_index]); 20530fdc8d8SChris Lattner ++m_index; 20630fdc8d8SChris Lattner result |= ((uint32_t)nibble_hi << (shift_amount + 4)); 20730fdc8d8SChris Lattner result |= ((uint32_t)nibble_lo << shift_amount); 20830fdc8d8SChris Lattner nibble_count += 2; 20930fdc8d8SChris Lattner shift_amount += 8; 21030fdc8d8SChris Lattner } 21130fdc8d8SChris Lattner else 21230fdc8d8SChris Lattner { 21330fdc8d8SChris Lattner result |= ((uint32_t)nibble_hi << shift_amount); 21430fdc8d8SChris Lattner nibble_count += 1; 21530fdc8d8SChris Lattner shift_amount += 4; 21630fdc8d8SChris Lattner } 21730fdc8d8SChris Lattner 21830fdc8d8SChris Lattner } 21930fdc8d8SChris Lattner } 22030fdc8d8SChris Lattner else 22130fdc8d8SChris Lattner { 22230fdc8d8SChris Lattner while (m_index < m_packet.size() && ::isxdigit (m_packet[m_index])) 22330fdc8d8SChris Lattner { 22430fdc8d8SChris Lattner // Make sure we don't exceed the size of a uint32_t... 22530fdc8d8SChris Lattner if (nibble_count >= (sizeof(uint32_t) * 2)) 22630fdc8d8SChris Lattner { 22730fdc8d8SChris Lattner m_index = UINT32_MAX; 22830fdc8d8SChris Lattner return fail_value; 22930fdc8d8SChris Lattner } 23030fdc8d8SChris Lattner 23130fdc8d8SChris Lattner uint8_t nibble = xdigit_to_sint (m_packet[m_index]); 23230fdc8d8SChris Lattner // Big Endian 23330fdc8d8SChris Lattner result <<= 4; 23430fdc8d8SChris Lattner result |= nibble; 23530fdc8d8SChris Lattner 23630fdc8d8SChris Lattner ++m_index; 23730fdc8d8SChris Lattner ++nibble_count; 23830fdc8d8SChris Lattner } 23930fdc8d8SChris Lattner } 24030fdc8d8SChris Lattner return result; 24130fdc8d8SChris Lattner } 24230fdc8d8SChris Lattner 24330fdc8d8SChris Lattner uint64_t 24430fdc8d8SChris Lattner StringExtractor::GetHexMaxU64 (bool little_endian, uint64_t fail_value) 24530fdc8d8SChris Lattner { 24630fdc8d8SChris Lattner uint64_t result = 0; 24730fdc8d8SChris Lattner uint32_t nibble_count = 0; 24830fdc8d8SChris Lattner 24930fdc8d8SChris Lattner if (little_endian) 25030fdc8d8SChris Lattner { 25130fdc8d8SChris Lattner uint32_t shift_amount = 0; 25230fdc8d8SChris Lattner while (m_index < m_packet.size() && ::isxdigit (m_packet[m_index])) 25330fdc8d8SChris Lattner { 25430fdc8d8SChris Lattner // Make sure we don't exceed the size of a uint64_t... 25530fdc8d8SChris Lattner if (nibble_count >= (sizeof(uint64_t) * 2)) 25630fdc8d8SChris Lattner { 25730fdc8d8SChris Lattner m_index = UINT32_MAX; 25830fdc8d8SChris Lattner return fail_value; 25930fdc8d8SChris Lattner } 26030fdc8d8SChris Lattner 26130fdc8d8SChris Lattner uint8_t nibble_lo; 26230fdc8d8SChris Lattner uint8_t nibble_hi = xdigit_to_sint (m_packet[m_index]); 26330fdc8d8SChris Lattner ++m_index; 26430fdc8d8SChris Lattner if (m_index < m_packet.size() && ::isxdigit (m_packet[m_index])) 26530fdc8d8SChris Lattner { 26630fdc8d8SChris Lattner nibble_lo = xdigit_to_sint (m_packet[m_index]); 26730fdc8d8SChris Lattner ++m_index; 26830fdc8d8SChris Lattner result |= ((uint64_t)nibble_hi << (shift_amount + 4)); 26930fdc8d8SChris Lattner result |= ((uint64_t)nibble_lo << shift_amount); 27030fdc8d8SChris Lattner nibble_count += 2; 27130fdc8d8SChris Lattner shift_amount += 8; 27230fdc8d8SChris Lattner } 27330fdc8d8SChris Lattner else 27430fdc8d8SChris Lattner { 27530fdc8d8SChris Lattner result |= ((uint64_t)nibble_hi << shift_amount); 27630fdc8d8SChris Lattner nibble_count += 1; 27730fdc8d8SChris Lattner shift_amount += 4; 27830fdc8d8SChris Lattner } 27930fdc8d8SChris Lattner 28030fdc8d8SChris Lattner } 28130fdc8d8SChris Lattner } 28230fdc8d8SChris Lattner else 28330fdc8d8SChris Lattner { 28430fdc8d8SChris Lattner while (m_index < m_packet.size() && ::isxdigit (m_packet[m_index])) 28530fdc8d8SChris Lattner { 28630fdc8d8SChris Lattner // Make sure we don't exceed the size of a uint64_t... 28730fdc8d8SChris Lattner if (nibble_count >= (sizeof(uint64_t) * 2)) 28830fdc8d8SChris Lattner { 28930fdc8d8SChris Lattner m_index = UINT32_MAX; 29030fdc8d8SChris Lattner return fail_value; 29130fdc8d8SChris Lattner } 29230fdc8d8SChris Lattner 29330fdc8d8SChris Lattner uint8_t nibble = xdigit_to_sint (m_packet[m_index]); 29430fdc8d8SChris Lattner // Big Endian 29530fdc8d8SChris Lattner result <<= 4; 29630fdc8d8SChris Lattner result |= nibble; 29730fdc8d8SChris Lattner 29830fdc8d8SChris Lattner ++m_index; 29930fdc8d8SChris Lattner ++nibble_count; 30030fdc8d8SChris Lattner } 30130fdc8d8SChris Lattner } 30230fdc8d8SChris Lattner return result; 30330fdc8d8SChris Lattner } 30430fdc8d8SChris Lattner 30530fdc8d8SChris Lattner size_t 30630fdc8d8SChris Lattner StringExtractor::GetHexBytes (void *dst_void, size_t dst_len, uint8_t fail_fill_value) 30730fdc8d8SChris Lattner { 30830fdc8d8SChris Lattner uint8_t *dst = (uint8_t*)dst_void; 30930fdc8d8SChris Lattner size_t bytes_extracted = 0; 31030fdc8d8SChris Lattner while (bytes_extracted < dst_len && GetBytesLeft ()) 31130fdc8d8SChris Lattner { 31230fdc8d8SChris Lattner dst[bytes_extracted] = GetHexU8 (fail_fill_value); 31330fdc8d8SChris Lattner if (IsGood()) 31430fdc8d8SChris Lattner ++bytes_extracted; 31530fdc8d8SChris Lattner else 31630fdc8d8SChris Lattner break; 31730fdc8d8SChris Lattner } 31830fdc8d8SChris Lattner 31930fdc8d8SChris Lattner for (size_t i = bytes_extracted; i < dst_len; ++i) 32030fdc8d8SChris Lattner dst[i] = fail_fill_value; 32130fdc8d8SChris Lattner 32230fdc8d8SChris Lattner return bytes_extracted; 32330fdc8d8SChris Lattner } 32430fdc8d8SChris Lattner 32530fdc8d8SChris Lattner 32630fdc8d8SChris Lattner // Consume ASCII hex nibble character pairs until we have decoded byte_size 32730fdc8d8SChris Lattner // bytes of data. 32830fdc8d8SChris Lattner 32930fdc8d8SChris Lattner uint64_t 33030fdc8d8SChris Lattner StringExtractor::GetHexWithFixedSize (uint32_t byte_size, bool little_endian, uint64_t fail_value) 33130fdc8d8SChris Lattner { 33230fdc8d8SChris Lattner if (byte_size <= 8 && GetBytesLeft() >= byte_size * 2) 33330fdc8d8SChris Lattner { 33430fdc8d8SChris Lattner uint64_t result = 0; 33530fdc8d8SChris Lattner uint32_t i; 33630fdc8d8SChris Lattner if (little_endian) 33730fdc8d8SChris Lattner { 33830fdc8d8SChris Lattner // Little Endian 33930fdc8d8SChris Lattner uint32_t shift_amount; 34030fdc8d8SChris Lattner for (i = 0, shift_amount = 0; 34130fdc8d8SChris Lattner i < byte_size && m_index != UINT32_MAX; 34230fdc8d8SChris Lattner ++i, shift_amount += 8) 34330fdc8d8SChris Lattner { 34430fdc8d8SChris Lattner result |= ((uint64_t)GetHexU8() << shift_amount); 34530fdc8d8SChris Lattner } 34630fdc8d8SChris Lattner } 34730fdc8d8SChris Lattner else 34830fdc8d8SChris Lattner { 34930fdc8d8SChris Lattner // Big Endian 35030fdc8d8SChris Lattner for (i = 0; i < byte_size && m_index != UINT32_MAX; ++i) 35130fdc8d8SChris Lattner { 35230fdc8d8SChris Lattner result <<= 8; 35330fdc8d8SChris Lattner result |= GetHexU8(); 35430fdc8d8SChris Lattner } 35530fdc8d8SChris Lattner } 35630fdc8d8SChris Lattner } 35730fdc8d8SChris Lattner m_index = UINT32_MAX; 35830fdc8d8SChris Lattner return fail_value; 35930fdc8d8SChris Lattner } 36030fdc8d8SChris Lattner 361de9d0494SGreg Clayton size_t 362de9d0494SGreg Clayton StringExtractor::GetHexByteString (std::string &str) 363de9d0494SGreg Clayton { 364de9d0494SGreg Clayton str.clear(); 365de9d0494SGreg Clayton char ch; 366de9d0494SGreg Clayton while ((ch = GetHexU8()) != '\0') 367de9d0494SGreg Clayton str.append(1, ch); 368de9d0494SGreg Clayton return str.size(); 369de9d0494SGreg Clayton } 370de9d0494SGreg Clayton 37130fdc8d8SChris Lattner bool 37230fdc8d8SChris Lattner StringExtractor::GetNameColonValue (std::string &name, std::string &value) 37330fdc8d8SChris Lattner { 37430fdc8d8SChris Lattner // Read something in the form of NNNN:VVVV; where NNNN is any character 37530fdc8d8SChris Lattner // that is not a colon, followed by a ':' character, then a value (one or 37630fdc8d8SChris Lattner // more ';' chars), followed by a ';' 37730fdc8d8SChris Lattner if (m_index < m_packet.size()) 37830fdc8d8SChris Lattner { 37930fdc8d8SChris Lattner const size_t colon_idx = m_packet.find (':', m_index); 38030fdc8d8SChris Lattner if (colon_idx != std::string::npos) 38130fdc8d8SChris Lattner { 38230fdc8d8SChris Lattner const size_t semicolon_idx = m_packet.find (';', colon_idx); 38330fdc8d8SChris Lattner if (semicolon_idx != std::string::npos) 38430fdc8d8SChris Lattner { 38530fdc8d8SChris Lattner name.assign (m_packet, m_index, colon_idx - m_index); 38630fdc8d8SChris Lattner value.assign (m_packet, colon_idx + 1, semicolon_idx - (colon_idx + 1)); 38730fdc8d8SChris Lattner m_index = semicolon_idx + 1; 38830fdc8d8SChris Lattner return true; 38930fdc8d8SChris Lattner } 39030fdc8d8SChris Lattner } 39130fdc8d8SChris Lattner } 39230fdc8d8SChris Lattner m_index = UINT32_MAX; 39330fdc8d8SChris Lattner return false; 39430fdc8d8SChris Lattner } 395