130fdc8d8SChris Lattner //===-- StringExtractor.cpp -------------------------------------*- C++ -*-===// 230fdc8d8SChris Lattner // 330fdc8d8SChris Lattner // The LLVM Compiler Infrastructure 430fdc8d8SChris Lattner // 530fdc8d8SChris Lattner // This file is distributed under the University of Illinois Open Source 630fdc8d8SChris Lattner // License. See LICENSE.TXT for details. 730fdc8d8SChris Lattner // 830fdc8d8SChris Lattner //===----------------------------------------------------------------------===// 930fdc8d8SChris Lattner 10c982c768SGreg Clayton #include "Utility/StringExtractor.h" 1130fdc8d8SChris Lattner 1230fdc8d8SChris Lattner // C Includes 1378709173SStephen Wilson #include <stdlib.h> 1478709173SStephen Wilson 1530fdc8d8SChris Lattner // C++ Includes 1630fdc8d8SChris Lattner // Other libraries and framework includes 1730fdc8d8SChris Lattner // Project includes 1830fdc8d8SChris Lattner 1930fdc8d8SChris Lattner static inline int 2030fdc8d8SChris Lattner xdigit_to_sint (char ch) 2130fdc8d8SChris Lattner { 2230fdc8d8SChris Lattner if (ch >= 'a' && ch <= 'f') 2330fdc8d8SChris Lattner return 10 + ch - 'a'; 241e89cd80SBenjamin Kramer if (ch >= 'A' && ch <= 'F') 251e89cd80SBenjamin Kramer return 10 + ch - 'A'; 2630fdc8d8SChris Lattner return ch - '0'; 2730fdc8d8SChris Lattner } 2830fdc8d8SChris Lattner 2930fdc8d8SChris Lattner static inline unsigned int 3030fdc8d8SChris Lattner xdigit_to_uint (uint8_t ch) 3130fdc8d8SChris Lattner { 3230fdc8d8SChris Lattner if (ch >= 'a' && ch <= 'f') 3330fdc8d8SChris Lattner return 10u + ch - 'a'; 341e89cd80SBenjamin Kramer if (ch >= 'A' && ch <= 'F') 351e89cd80SBenjamin Kramer return 10u + ch - 'A'; 3630fdc8d8SChris Lattner return ch - '0'; 3730fdc8d8SChris Lattner } 3830fdc8d8SChris Lattner 3930fdc8d8SChris Lattner //---------------------------------------------------------------------- 4030fdc8d8SChris Lattner // StringExtractor constructor 4130fdc8d8SChris Lattner //---------------------------------------------------------------------- 4230fdc8d8SChris Lattner StringExtractor::StringExtractor() : 4330fdc8d8SChris Lattner m_packet(), 4430fdc8d8SChris Lattner m_index (0) 4530fdc8d8SChris Lattner { 4630fdc8d8SChris Lattner } 4730fdc8d8SChris Lattner 4830fdc8d8SChris Lattner 4930fdc8d8SChris Lattner StringExtractor::StringExtractor(const char *packet_cstr) : 5030fdc8d8SChris Lattner m_packet(), 5130fdc8d8SChris Lattner m_index (0) 5230fdc8d8SChris Lattner { 5330fdc8d8SChris Lattner if (packet_cstr) 5430fdc8d8SChris Lattner m_packet.assign (packet_cstr); 5530fdc8d8SChris Lattner } 5630fdc8d8SChris Lattner 5730fdc8d8SChris Lattner 5830fdc8d8SChris Lattner //---------------------------------------------------------------------- 5930fdc8d8SChris Lattner // StringExtractor copy constructor 6030fdc8d8SChris Lattner //---------------------------------------------------------------------- 6130fdc8d8SChris Lattner StringExtractor::StringExtractor(const StringExtractor& rhs) : 6230fdc8d8SChris Lattner m_packet (rhs.m_packet), 6330fdc8d8SChris Lattner m_index (rhs.m_index) 6430fdc8d8SChris Lattner { 6530fdc8d8SChris Lattner 6630fdc8d8SChris Lattner } 6730fdc8d8SChris Lattner 6830fdc8d8SChris Lattner //---------------------------------------------------------------------- 6930fdc8d8SChris Lattner // StringExtractor assignment operator 7030fdc8d8SChris Lattner //---------------------------------------------------------------------- 7130fdc8d8SChris Lattner const StringExtractor& 7230fdc8d8SChris Lattner StringExtractor::operator=(const StringExtractor& rhs) 7330fdc8d8SChris Lattner { 7430fdc8d8SChris Lattner if (this != &rhs) 7530fdc8d8SChris Lattner { 7630fdc8d8SChris Lattner m_packet = rhs.m_packet; 7730fdc8d8SChris Lattner m_index = rhs.m_index; 7830fdc8d8SChris Lattner 7930fdc8d8SChris Lattner } 8030fdc8d8SChris Lattner return *this; 8130fdc8d8SChris Lattner } 8230fdc8d8SChris Lattner 8330fdc8d8SChris Lattner //---------------------------------------------------------------------- 8430fdc8d8SChris Lattner // Destructor 8530fdc8d8SChris Lattner //---------------------------------------------------------------------- 8630fdc8d8SChris Lattner StringExtractor::~StringExtractor() 8730fdc8d8SChris Lattner { 8830fdc8d8SChris Lattner } 8930fdc8d8SChris Lattner 9030fdc8d8SChris Lattner 9130fdc8d8SChris Lattner char 9230fdc8d8SChris Lattner StringExtractor::GetChar (char fail_value) 9330fdc8d8SChris Lattner { 9430fdc8d8SChris Lattner if (m_index < m_packet.size()) 9530fdc8d8SChris Lattner { 9630fdc8d8SChris Lattner char ch = m_packet[m_index]; 9730fdc8d8SChris Lattner ++m_index; 9830fdc8d8SChris Lattner return ch; 9930fdc8d8SChris Lattner } 10030fdc8d8SChris Lattner m_index = UINT32_MAX; 10130fdc8d8SChris Lattner return fail_value; 10230fdc8d8SChris Lattner } 10330fdc8d8SChris Lattner 10430fdc8d8SChris Lattner uint32_t 10530fdc8d8SChris Lattner StringExtractor::GetNumHexASCIICharsAtFilePos (uint32_t max) const 10630fdc8d8SChris Lattner { 10730fdc8d8SChris Lattner uint32_t idx = m_index; 10830fdc8d8SChris Lattner const size_t size = m_packet.size(); 10930fdc8d8SChris Lattner while (idx < size && idx - m_index < max && isxdigit(m_packet[idx])) 11030fdc8d8SChris Lattner ++idx; 11130fdc8d8SChris Lattner return idx - m_index; 11230fdc8d8SChris Lattner } 11330fdc8d8SChris Lattner //---------------------------------------------------------------------- 11430fdc8d8SChris Lattner // Extract a signed character from two hex ASCII chars in the packet 11530fdc8d8SChris Lattner // string 11630fdc8d8SChris Lattner //---------------------------------------------------------------------- 11730fdc8d8SChris Lattner int8_t 11830fdc8d8SChris Lattner StringExtractor::GetHexS8 (int8_t fail_value) 11930fdc8d8SChris Lattner { 12030fdc8d8SChris Lattner if (GetNumHexASCIICharsAtFilePos(2)) 12130fdc8d8SChris Lattner { 12230fdc8d8SChris Lattner char hi_nibble_char = m_packet[m_index]; 12330fdc8d8SChris Lattner char lo_nibble_char = m_packet[m_index+1]; 12430fdc8d8SChris Lattner char hi_nibble = xdigit_to_sint (hi_nibble_char); 12530fdc8d8SChris Lattner char lo_nibble = xdigit_to_sint (lo_nibble_char); 12630fdc8d8SChris Lattner m_index += 2; 12730fdc8d8SChris Lattner return (hi_nibble << 4) + lo_nibble; 12830fdc8d8SChris Lattner } 12930fdc8d8SChris Lattner m_index = UINT32_MAX; 13030fdc8d8SChris Lattner return fail_value; 13130fdc8d8SChris Lattner } 13230fdc8d8SChris Lattner 13330fdc8d8SChris Lattner //---------------------------------------------------------------------- 13430fdc8d8SChris Lattner // Extract an unsigned character from two hex ASCII chars in the packet 13530fdc8d8SChris Lattner // string 13630fdc8d8SChris Lattner //---------------------------------------------------------------------- 13730fdc8d8SChris Lattner uint8_t 138*7b70be39SGreg Clayton StringExtractor::GetHexU8 (uint8_t fail_value, bool set_eof_on_fail) 13930fdc8d8SChris Lattner { 14030fdc8d8SChris Lattner if (GetNumHexASCIICharsAtFilePos(2)) 14130fdc8d8SChris Lattner { 14230fdc8d8SChris Lattner uint8_t hi_nibble_char = m_packet[m_index]; 14330fdc8d8SChris Lattner uint8_t lo_nibble_char = m_packet[m_index+1]; 14471337622SGreg Clayton uint8_t hi_nibble = xdigit_to_uint (hi_nibble_char); 14571337622SGreg Clayton uint8_t lo_nibble = xdigit_to_uint (lo_nibble_char); 14630fdc8d8SChris Lattner m_index += 2; 14730fdc8d8SChris Lattner return (hi_nibble << 4) + lo_nibble; 14830fdc8d8SChris Lattner } 149*7b70be39SGreg Clayton if (set_eof_on_fail || m_index >= m_packet.size()) 15030fdc8d8SChris Lattner m_index = UINT32_MAX; 15130fdc8d8SChris Lattner return fail_value; 15230fdc8d8SChris Lattner } 15330fdc8d8SChris Lattner 15430fdc8d8SChris Lattner uint32_t 15532e0a750SGreg Clayton StringExtractor::GetU32 (uint32_t fail_value, int base) 15632e0a750SGreg Clayton { 15732e0a750SGreg Clayton if (m_index < m_packet.size()) 15832e0a750SGreg Clayton { 15932e0a750SGreg Clayton char *end = NULL; 16032e0a750SGreg Clayton const char *start = m_packet.c_str(); 16132e0a750SGreg Clayton const char *uint_cstr = start + m_index; 16232e0a750SGreg Clayton uint32_t result = ::strtoul (uint_cstr, &end, base); 16332e0a750SGreg Clayton 16432e0a750SGreg Clayton if (end && end != uint_cstr) 16532e0a750SGreg Clayton { 16632e0a750SGreg Clayton m_index = end - start; 16732e0a750SGreg Clayton return result; 16832e0a750SGreg Clayton } 16932e0a750SGreg Clayton } 17032e0a750SGreg Clayton return fail_value; 17132e0a750SGreg Clayton } 17232e0a750SGreg Clayton 17332e0a750SGreg Clayton 17432e0a750SGreg Clayton uint32_t 17530fdc8d8SChris Lattner StringExtractor::GetHexMaxU32 (bool little_endian, uint32_t fail_value) 17630fdc8d8SChris Lattner { 17730fdc8d8SChris Lattner uint32_t result = 0; 17830fdc8d8SChris Lattner uint32_t nibble_count = 0; 17930fdc8d8SChris Lattner 18030fdc8d8SChris Lattner if (little_endian) 18130fdc8d8SChris Lattner { 18230fdc8d8SChris Lattner uint32_t shift_amount = 0; 18330fdc8d8SChris Lattner while (m_index < m_packet.size() && ::isxdigit (m_packet[m_index])) 18430fdc8d8SChris Lattner { 18530fdc8d8SChris Lattner // Make sure we don't exceed the size of a uint32_t... 18630fdc8d8SChris Lattner if (nibble_count >= (sizeof(uint32_t) * 2)) 18730fdc8d8SChris Lattner { 18830fdc8d8SChris Lattner m_index = UINT32_MAX; 18930fdc8d8SChris Lattner return fail_value; 19030fdc8d8SChris Lattner } 19130fdc8d8SChris Lattner 19230fdc8d8SChris Lattner uint8_t nibble_lo; 19330fdc8d8SChris Lattner uint8_t nibble_hi = xdigit_to_sint (m_packet[m_index]); 19430fdc8d8SChris Lattner ++m_index; 19530fdc8d8SChris Lattner if (m_index < m_packet.size() && ::isxdigit (m_packet[m_index])) 19630fdc8d8SChris Lattner { 19730fdc8d8SChris Lattner nibble_lo = xdigit_to_sint (m_packet[m_index]); 19830fdc8d8SChris Lattner ++m_index; 19930fdc8d8SChris Lattner result |= ((uint32_t)nibble_hi << (shift_amount + 4)); 20030fdc8d8SChris Lattner result |= ((uint32_t)nibble_lo << shift_amount); 20130fdc8d8SChris Lattner nibble_count += 2; 20230fdc8d8SChris Lattner shift_amount += 8; 20330fdc8d8SChris Lattner } 20430fdc8d8SChris Lattner else 20530fdc8d8SChris Lattner { 20630fdc8d8SChris Lattner result |= ((uint32_t)nibble_hi << shift_amount); 20730fdc8d8SChris Lattner nibble_count += 1; 20830fdc8d8SChris Lattner shift_amount += 4; 20930fdc8d8SChris Lattner } 21030fdc8d8SChris Lattner 21130fdc8d8SChris Lattner } 21230fdc8d8SChris Lattner } 21330fdc8d8SChris Lattner else 21430fdc8d8SChris Lattner { 21530fdc8d8SChris Lattner while (m_index < m_packet.size() && ::isxdigit (m_packet[m_index])) 21630fdc8d8SChris Lattner { 21730fdc8d8SChris Lattner // Make sure we don't exceed the size of a uint32_t... 21830fdc8d8SChris Lattner if (nibble_count >= (sizeof(uint32_t) * 2)) 21930fdc8d8SChris Lattner { 22030fdc8d8SChris Lattner m_index = UINT32_MAX; 22130fdc8d8SChris Lattner return fail_value; 22230fdc8d8SChris Lattner } 22330fdc8d8SChris Lattner 22430fdc8d8SChris Lattner uint8_t nibble = xdigit_to_sint (m_packet[m_index]); 22530fdc8d8SChris Lattner // Big Endian 22630fdc8d8SChris Lattner result <<= 4; 22730fdc8d8SChris Lattner result |= nibble; 22830fdc8d8SChris Lattner 22930fdc8d8SChris Lattner ++m_index; 23030fdc8d8SChris Lattner ++nibble_count; 23130fdc8d8SChris Lattner } 23230fdc8d8SChris Lattner } 23330fdc8d8SChris Lattner return result; 23430fdc8d8SChris Lattner } 23530fdc8d8SChris Lattner 23630fdc8d8SChris Lattner uint64_t 23730fdc8d8SChris Lattner StringExtractor::GetHexMaxU64 (bool little_endian, uint64_t fail_value) 23830fdc8d8SChris Lattner { 23930fdc8d8SChris Lattner uint64_t result = 0; 24030fdc8d8SChris Lattner uint32_t nibble_count = 0; 24130fdc8d8SChris Lattner 24230fdc8d8SChris Lattner if (little_endian) 24330fdc8d8SChris Lattner { 24430fdc8d8SChris Lattner uint32_t shift_amount = 0; 24530fdc8d8SChris Lattner while (m_index < m_packet.size() && ::isxdigit (m_packet[m_index])) 24630fdc8d8SChris Lattner { 24730fdc8d8SChris Lattner // Make sure we don't exceed the size of a uint64_t... 24830fdc8d8SChris Lattner if (nibble_count >= (sizeof(uint64_t) * 2)) 24930fdc8d8SChris Lattner { 25030fdc8d8SChris Lattner m_index = UINT32_MAX; 25130fdc8d8SChris Lattner return fail_value; 25230fdc8d8SChris Lattner } 25330fdc8d8SChris Lattner 25430fdc8d8SChris Lattner uint8_t nibble_lo; 25530fdc8d8SChris Lattner uint8_t nibble_hi = xdigit_to_sint (m_packet[m_index]); 25630fdc8d8SChris Lattner ++m_index; 25730fdc8d8SChris Lattner if (m_index < m_packet.size() && ::isxdigit (m_packet[m_index])) 25830fdc8d8SChris Lattner { 25930fdc8d8SChris Lattner nibble_lo = xdigit_to_sint (m_packet[m_index]); 26030fdc8d8SChris Lattner ++m_index; 26130fdc8d8SChris Lattner result |= ((uint64_t)nibble_hi << (shift_amount + 4)); 26230fdc8d8SChris Lattner result |= ((uint64_t)nibble_lo << shift_amount); 26330fdc8d8SChris Lattner nibble_count += 2; 26430fdc8d8SChris Lattner shift_amount += 8; 26530fdc8d8SChris Lattner } 26630fdc8d8SChris Lattner else 26730fdc8d8SChris Lattner { 26830fdc8d8SChris Lattner result |= ((uint64_t)nibble_hi << shift_amount); 26930fdc8d8SChris Lattner nibble_count += 1; 27030fdc8d8SChris Lattner shift_amount += 4; 27130fdc8d8SChris Lattner } 27230fdc8d8SChris Lattner 27330fdc8d8SChris Lattner } 27430fdc8d8SChris Lattner } 27530fdc8d8SChris Lattner else 27630fdc8d8SChris Lattner { 27730fdc8d8SChris Lattner while (m_index < m_packet.size() && ::isxdigit (m_packet[m_index])) 27830fdc8d8SChris Lattner { 27930fdc8d8SChris Lattner // Make sure we don't exceed the size of a uint64_t... 28030fdc8d8SChris Lattner if (nibble_count >= (sizeof(uint64_t) * 2)) 28130fdc8d8SChris Lattner { 28230fdc8d8SChris Lattner m_index = UINT32_MAX; 28330fdc8d8SChris Lattner return fail_value; 28430fdc8d8SChris Lattner } 28530fdc8d8SChris Lattner 28630fdc8d8SChris Lattner uint8_t nibble = xdigit_to_sint (m_packet[m_index]); 28730fdc8d8SChris Lattner // Big Endian 28830fdc8d8SChris Lattner result <<= 4; 28930fdc8d8SChris Lattner result |= nibble; 29030fdc8d8SChris Lattner 29130fdc8d8SChris Lattner ++m_index; 29230fdc8d8SChris Lattner ++nibble_count; 29330fdc8d8SChris Lattner } 29430fdc8d8SChris Lattner } 29530fdc8d8SChris Lattner return result; 29630fdc8d8SChris Lattner } 29730fdc8d8SChris Lattner 29830fdc8d8SChris Lattner size_t 29930fdc8d8SChris Lattner StringExtractor::GetHexBytes (void *dst_void, size_t dst_len, uint8_t fail_fill_value) 30030fdc8d8SChris Lattner { 30130fdc8d8SChris Lattner uint8_t *dst = (uint8_t*)dst_void; 30230fdc8d8SChris Lattner size_t bytes_extracted = 0; 30330fdc8d8SChris Lattner while (bytes_extracted < dst_len && GetBytesLeft ()) 30430fdc8d8SChris Lattner { 30530fdc8d8SChris Lattner dst[bytes_extracted] = GetHexU8 (fail_fill_value); 30630fdc8d8SChris Lattner if (IsGood()) 30730fdc8d8SChris Lattner ++bytes_extracted; 30830fdc8d8SChris Lattner else 30930fdc8d8SChris Lattner break; 31030fdc8d8SChris Lattner } 31130fdc8d8SChris Lattner 31230fdc8d8SChris Lattner for (size_t i = bytes_extracted; i < dst_len; ++i) 31330fdc8d8SChris Lattner dst[i] = fail_fill_value; 31430fdc8d8SChris Lattner 31530fdc8d8SChris Lattner return bytes_extracted; 31630fdc8d8SChris Lattner } 31730fdc8d8SChris Lattner 31830fdc8d8SChris Lattner 31930fdc8d8SChris Lattner // Consume ASCII hex nibble character pairs until we have decoded byte_size 32030fdc8d8SChris Lattner // bytes of data. 32130fdc8d8SChris Lattner 32230fdc8d8SChris Lattner uint64_t 32330fdc8d8SChris Lattner StringExtractor::GetHexWithFixedSize (uint32_t byte_size, bool little_endian, uint64_t fail_value) 32430fdc8d8SChris Lattner { 32530fdc8d8SChris Lattner if (byte_size <= 8 && GetBytesLeft() >= byte_size * 2) 32630fdc8d8SChris Lattner { 32730fdc8d8SChris Lattner uint64_t result = 0; 32830fdc8d8SChris Lattner uint32_t i; 32930fdc8d8SChris Lattner if (little_endian) 33030fdc8d8SChris Lattner { 33130fdc8d8SChris Lattner // Little Endian 33230fdc8d8SChris Lattner uint32_t shift_amount; 33330fdc8d8SChris Lattner for (i = 0, shift_amount = 0; 33430fdc8d8SChris Lattner i < byte_size && m_index != UINT32_MAX; 33530fdc8d8SChris Lattner ++i, shift_amount += 8) 33630fdc8d8SChris Lattner { 33730fdc8d8SChris Lattner result |= ((uint64_t)GetHexU8() << shift_amount); 33830fdc8d8SChris Lattner } 33930fdc8d8SChris Lattner } 34030fdc8d8SChris Lattner else 34130fdc8d8SChris Lattner { 34230fdc8d8SChris Lattner // Big Endian 34330fdc8d8SChris Lattner for (i = 0; i < byte_size && m_index != UINT32_MAX; ++i) 34430fdc8d8SChris Lattner { 34530fdc8d8SChris Lattner result <<= 8; 34630fdc8d8SChris Lattner result |= GetHexU8(); 34730fdc8d8SChris Lattner } 34830fdc8d8SChris Lattner } 34930fdc8d8SChris Lattner } 35030fdc8d8SChris Lattner m_index = UINT32_MAX; 35130fdc8d8SChris Lattner return fail_value; 35230fdc8d8SChris Lattner } 35330fdc8d8SChris Lattner 354de9d0494SGreg Clayton size_t 355de9d0494SGreg Clayton StringExtractor::GetHexByteString (std::string &str) 356de9d0494SGreg Clayton { 357de9d0494SGreg Clayton str.clear(); 358de9d0494SGreg Clayton char ch; 359de9d0494SGreg Clayton while ((ch = GetHexU8()) != '\0') 360de9d0494SGreg Clayton str.append(1, ch); 361de9d0494SGreg Clayton return str.size(); 362de9d0494SGreg Clayton } 363de9d0494SGreg Clayton 36430fdc8d8SChris Lattner bool 36530fdc8d8SChris Lattner StringExtractor::GetNameColonValue (std::string &name, std::string &value) 36630fdc8d8SChris Lattner { 36730fdc8d8SChris Lattner // Read something in the form of NNNN:VVVV; where NNNN is any character 36830fdc8d8SChris Lattner // that is not a colon, followed by a ':' character, then a value (one or 36930fdc8d8SChris Lattner // more ';' chars), followed by a ';' 37030fdc8d8SChris Lattner if (m_index < m_packet.size()) 37130fdc8d8SChris Lattner { 37230fdc8d8SChris Lattner const size_t colon_idx = m_packet.find (':', m_index); 37330fdc8d8SChris Lattner if (colon_idx != std::string::npos) 37430fdc8d8SChris Lattner { 37530fdc8d8SChris Lattner const size_t semicolon_idx = m_packet.find (';', colon_idx); 37630fdc8d8SChris Lattner if (semicolon_idx != std::string::npos) 37730fdc8d8SChris Lattner { 37830fdc8d8SChris Lattner name.assign (m_packet, m_index, colon_idx - m_index); 37930fdc8d8SChris Lattner value.assign (m_packet, colon_idx + 1, semicolon_idx - (colon_idx + 1)); 38030fdc8d8SChris Lattner m_index = semicolon_idx + 1; 38130fdc8d8SChris Lattner return true; 38230fdc8d8SChris Lattner } 38330fdc8d8SChris Lattner } 38430fdc8d8SChris Lattner } 38530fdc8d8SChris Lattner m_index = UINT32_MAX; 38630fdc8d8SChris Lattner return false; 38730fdc8d8SChris Lattner } 388