130fdc8d8SChris Lattner //===-- StringExtractor.cpp -------------------------------------*- C++ -*-===// 230fdc8d8SChris Lattner // 330fdc8d8SChris Lattner // The LLVM Compiler Infrastructure 430fdc8d8SChris Lattner // 530fdc8d8SChris Lattner // This file is distributed under the University of Illinois Open Source 630fdc8d8SChris Lattner // License. See LICENSE.TXT for details. 730fdc8d8SChris Lattner // 830fdc8d8SChris Lattner //===----------------------------------------------------------------------===// 930fdc8d8SChris Lattner 10c982c768SGreg Clayton #include "Utility/StringExtractor.h" 1130fdc8d8SChris Lattner 1230fdc8d8SChris Lattner // C Includes 1330fdc8d8SChris Lattner // C++ Includes 1430fdc8d8SChris Lattner // Other libraries and framework includes 1530fdc8d8SChris Lattner // Project includes 1630fdc8d8SChris Lattner 1730fdc8d8SChris Lattner static inline int 1830fdc8d8SChris Lattner xdigit_to_sint (char ch) 1930fdc8d8SChris Lattner { 2030fdc8d8SChris Lattner if (ch >= 'a' && ch <= 'f') 2130fdc8d8SChris Lattner return 10 + ch - 'a'; 221e89cd80SBenjamin Kramer if (ch >= 'A' && ch <= 'F') 231e89cd80SBenjamin Kramer return 10 + ch - 'A'; 2430fdc8d8SChris Lattner return ch - '0'; 2530fdc8d8SChris Lattner } 2630fdc8d8SChris Lattner 2730fdc8d8SChris Lattner static inline unsigned int 2830fdc8d8SChris Lattner xdigit_to_uint (uint8_t ch) 2930fdc8d8SChris Lattner { 3030fdc8d8SChris Lattner if (ch >= 'a' && ch <= 'f') 3130fdc8d8SChris Lattner return 10u + ch - 'a'; 321e89cd80SBenjamin Kramer if (ch >= 'A' && ch <= 'F') 331e89cd80SBenjamin Kramer return 10u + ch - 'A'; 3430fdc8d8SChris Lattner return ch - '0'; 3530fdc8d8SChris Lattner } 3630fdc8d8SChris Lattner 3730fdc8d8SChris Lattner //---------------------------------------------------------------------- 3830fdc8d8SChris Lattner // StringExtractor constructor 3930fdc8d8SChris Lattner //---------------------------------------------------------------------- 4030fdc8d8SChris Lattner 
// Default constructor: starts with an empty packet and the read cursor at
// the first character.
StringExtractor::StringExtractor() :
    m_packet (),
    m_index (0)
{
}


// Construct from a C string. A NULL pointer yields an empty packet; in both
// cases the read cursor starts at offset zero.
StringExtractor::StringExtractor(const char *packet_cstr) :
    m_packet (packet_cstr ? packet_cstr : ""),
    m_index (0)
{
}


//----------------------------------------------------------------------
// StringExtractor copy constructor
//
// Duplicates both the packet text and the current read position.
//----------------------------------------------------------------------
StringExtractor::StringExtractor(const StringExtractor& rhs) :
    m_packet (rhs.m_packet),
    m_index (rhs.m_index)
{
}

//----------------------------------------------------------------------
// StringExtractor assignment operator
//
// Copies the packet text and the read position from "rhs";
// self-assignment is a no-op.
//----------------------------------------------------------------------
const StringExtractor&
StringExtractor::operator=(const StringExtractor& rhs)
{
    if (this == &rhs)
        return *this;

    m_packet = rhs.m_packet;
    m_index = rhs.m_index;
    return *this;
}

//----------------------------------------------------------------------
// Destructor
8330fdc8d8SChris Lattner //---------------------------------------------------------------------- 8430fdc8d8SChris Lattner StringExtractor::~StringExtractor() 8530fdc8d8SChris Lattner { 8630fdc8d8SChris Lattner } 8730fdc8d8SChris Lattner 8830fdc8d8SChris Lattner 8930fdc8d8SChris Lattner char 9030fdc8d8SChris Lattner StringExtractor::GetChar (char fail_value) 9130fdc8d8SChris Lattner { 9230fdc8d8SChris Lattner if (m_index < m_packet.size()) 9330fdc8d8SChris Lattner { 9430fdc8d8SChris Lattner char ch = m_packet[m_index]; 9530fdc8d8SChris Lattner ++m_index; 9630fdc8d8SChris Lattner return ch; 9730fdc8d8SChris Lattner } 9830fdc8d8SChris Lattner m_index = UINT32_MAX; 9930fdc8d8SChris Lattner return fail_value; 10030fdc8d8SChris Lattner } 10130fdc8d8SChris Lattner 10230fdc8d8SChris Lattner uint32_t 10330fdc8d8SChris Lattner StringExtractor::GetNumHexASCIICharsAtFilePos (uint32_t max) const 10430fdc8d8SChris Lattner { 10530fdc8d8SChris Lattner uint32_t idx = m_index; 10630fdc8d8SChris Lattner const size_t size = m_packet.size(); 10730fdc8d8SChris Lattner while (idx < size && idx - m_index < max && isxdigit(m_packet[idx])) 10830fdc8d8SChris Lattner ++idx; 10930fdc8d8SChris Lattner return idx - m_index; 11030fdc8d8SChris Lattner } 11130fdc8d8SChris Lattner //---------------------------------------------------------------------- 11230fdc8d8SChris Lattner // Extract a signed character from two hex ASCII chars in the packet 11330fdc8d8SChris Lattner // string 11430fdc8d8SChris Lattner //---------------------------------------------------------------------- 11530fdc8d8SChris Lattner int8_t 11630fdc8d8SChris Lattner StringExtractor::GetHexS8 (int8_t fail_value) 11730fdc8d8SChris Lattner { 11830fdc8d8SChris Lattner if (GetNumHexASCIICharsAtFilePos(2)) 11930fdc8d8SChris Lattner { 12030fdc8d8SChris Lattner char hi_nibble_char = m_packet[m_index]; 12130fdc8d8SChris Lattner char lo_nibble_char = m_packet[m_index+1]; 12230fdc8d8SChris Lattner 12330fdc8d8SChris Lattner if 
(isxdigit(hi_nibble_char) && isxdigit(lo_nibble_char)) 12430fdc8d8SChris Lattner { 12530fdc8d8SChris Lattner char hi_nibble = xdigit_to_sint (hi_nibble_char); 12630fdc8d8SChris Lattner char lo_nibble = xdigit_to_sint (lo_nibble_char); 12730fdc8d8SChris Lattner m_index += 2; 12830fdc8d8SChris Lattner return (hi_nibble << 4) + lo_nibble; 12930fdc8d8SChris Lattner } 13030fdc8d8SChris Lattner } 13130fdc8d8SChris Lattner m_index = UINT32_MAX; 13230fdc8d8SChris Lattner return fail_value; 13330fdc8d8SChris Lattner } 13430fdc8d8SChris Lattner 13530fdc8d8SChris Lattner //---------------------------------------------------------------------- 13630fdc8d8SChris Lattner // Extract an unsigned character from two hex ASCII chars in the packet 13730fdc8d8SChris Lattner // string 13830fdc8d8SChris Lattner //---------------------------------------------------------------------- 13930fdc8d8SChris Lattner uint8_t 14030fdc8d8SChris Lattner StringExtractor::GetHexU8 (uint8_t fail_value) 14130fdc8d8SChris Lattner { 14230fdc8d8SChris Lattner if (GetNumHexASCIICharsAtFilePos(2)) 14330fdc8d8SChris Lattner { 14430fdc8d8SChris Lattner uint8_t hi_nibble_char = m_packet[m_index]; 14530fdc8d8SChris Lattner uint8_t lo_nibble_char = m_packet[m_index+1]; 14630fdc8d8SChris Lattner 14730fdc8d8SChris Lattner if (isxdigit(hi_nibble_char) && isxdigit(lo_nibble_char)) 14830fdc8d8SChris Lattner { 14971337622SGreg Clayton uint8_t hi_nibble = xdigit_to_uint (hi_nibble_char); 15071337622SGreg Clayton uint8_t lo_nibble = xdigit_to_uint (lo_nibble_char); 15130fdc8d8SChris Lattner m_index += 2; 15230fdc8d8SChris Lattner return (hi_nibble << 4) + lo_nibble; 15330fdc8d8SChris Lattner } 15430fdc8d8SChris Lattner } 15530fdc8d8SChris Lattner m_index = UINT32_MAX; 15630fdc8d8SChris Lattner return fail_value; 15730fdc8d8SChris Lattner } 15830fdc8d8SChris Lattner 15930fdc8d8SChris Lattner uint32_t 160*32e0a750SGreg Clayton StringExtractor::GetU32 (uint32_t fail_value, int base) 161*32e0a750SGreg Clayton { 
162*32e0a750SGreg Clayton if (m_index < m_packet.size()) 163*32e0a750SGreg Clayton { 164*32e0a750SGreg Clayton char *end = NULL; 165*32e0a750SGreg Clayton const char *start = m_packet.c_str(); 166*32e0a750SGreg Clayton const char *uint_cstr = start + m_index; 167*32e0a750SGreg Clayton uint32_t result = ::strtoul (uint_cstr, &end, base); 168*32e0a750SGreg Clayton 169*32e0a750SGreg Clayton if (end && end != uint_cstr) 170*32e0a750SGreg Clayton { 171*32e0a750SGreg Clayton m_index = end - start; 172*32e0a750SGreg Clayton return result; 173*32e0a750SGreg Clayton } 174*32e0a750SGreg Clayton } 175*32e0a750SGreg Clayton return fail_value; 176*32e0a750SGreg Clayton } 177*32e0a750SGreg Clayton 178*32e0a750SGreg Clayton 179*32e0a750SGreg Clayton uint32_t 18030fdc8d8SChris Lattner StringExtractor::GetHexMaxU32 (bool little_endian, uint32_t fail_value) 18130fdc8d8SChris Lattner { 18230fdc8d8SChris Lattner uint32_t result = 0; 18330fdc8d8SChris Lattner uint32_t nibble_count = 0; 18430fdc8d8SChris Lattner 18530fdc8d8SChris Lattner if (little_endian) 18630fdc8d8SChris Lattner { 18730fdc8d8SChris Lattner uint32_t shift_amount = 0; 18830fdc8d8SChris Lattner while (m_index < m_packet.size() && ::isxdigit (m_packet[m_index])) 18930fdc8d8SChris Lattner { 19030fdc8d8SChris Lattner // Make sure we don't exceed the size of a uint32_t... 
19130fdc8d8SChris Lattner if (nibble_count >= (sizeof(uint32_t) * 2)) 19230fdc8d8SChris Lattner { 19330fdc8d8SChris Lattner m_index = UINT32_MAX; 19430fdc8d8SChris Lattner return fail_value; 19530fdc8d8SChris Lattner } 19630fdc8d8SChris Lattner 19730fdc8d8SChris Lattner uint8_t nibble_lo; 19830fdc8d8SChris Lattner uint8_t nibble_hi = xdigit_to_sint (m_packet[m_index]); 19930fdc8d8SChris Lattner ++m_index; 20030fdc8d8SChris Lattner if (m_index < m_packet.size() && ::isxdigit (m_packet[m_index])) 20130fdc8d8SChris Lattner { 20230fdc8d8SChris Lattner nibble_lo = xdigit_to_sint (m_packet[m_index]); 20330fdc8d8SChris Lattner ++m_index; 20430fdc8d8SChris Lattner result |= ((uint32_t)nibble_hi << (shift_amount + 4)); 20530fdc8d8SChris Lattner result |= ((uint32_t)nibble_lo << shift_amount); 20630fdc8d8SChris Lattner nibble_count += 2; 20730fdc8d8SChris Lattner shift_amount += 8; 20830fdc8d8SChris Lattner } 20930fdc8d8SChris Lattner else 21030fdc8d8SChris Lattner { 21130fdc8d8SChris Lattner result |= ((uint32_t)nibble_hi << shift_amount); 21230fdc8d8SChris Lattner nibble_count += 1; 21330fdc8d8SChris Lattner shift_amount += 4; 21430fdc8d8SChris Lattner } 21530fdc8d8SChris Lattner 21630fdc8d8SChris Lattner } 21730fdc8d8SChris Lattner } 21830fdc8d8SChris Lattner else 21930fdc8d8SChris Lattner { 22030fdc8d8SChris Lattner while (m_index < m_packet.size() && ::isxdigit (m_packet[m_index])) 22130fdc8d8SChris Lattner { 22230fdc8d8SChris Lattner // Make sure we don't exceed the size of a uint32_t... 
22330fdc8d8SChris Lattner if (nibble_count >= (sizeof(uint32_t) * 2)) 22430fdc8d8SChris Lattner { 22530fdc8d8SChris Lattner m_index = UINT32_MAX; 22630fdc8d8SChris Lattner return fail_value; 22730fdc8d8SChris Lattner } 22830fdc8d8SChris Lattner 22930fdc8d8SChris Lattner uint8_t nibble = xdigit_to_sint (m_packet[m_index]); 23030fdc8d8SChris Lattner // Big Endian 23130fdc8d8SChris Lattner result <<= 4; 23230fdc8d8SChris Lattner result |= nibble; 23330fdc8d8SChris Lattner 23430fdc8d8SChris Lattner ++m_index; 23530fdc8d8SChris Lattner ++nibble_count; 23630fdc8d8SChris Lattner } 23730fdc8d8SChris Lattner } 23830fdc8d8SChris Lattner return result; 23930fdc8d8SChris Lattner } 24030fdc8d8SChris Lattner 24130fdc8d8SChris Lattner uint64_t 24230fdc8d8SChris Lattner StringExtractor::GetHexMaxU64 (bool little_endian, uint64_t fail_value) 24330fdc8d8SChris Lattner { 24430fdc8d8SChris Lattner uint64_t result = 0; 24530fdc8d8SChris Lattner uint32_t nibble_count = 0; 24630fdc8d8SChris Lattner 24730fdc8d8SChris Lattner if (little_endian) 24830fdc8d8SChris Lattner { 24930fdc8d8SChris Lattner uint32_t shift_amount = 0; 25030fdc8d8SChris Lattner while (m_index < m_packet.size() && ::isxdigit (m_packet[m_index])) 25130fdc8d8SChris Lattner { 25230fdc8d8SChris Lattner // Make sure we don't exceed the size of a uint64_t... 
25330fdc8d8SChris Lattner if (nibble_count >= (sizeof(uint64_t) * 2)) 25430fdc8d8SChris Lattner { 25530fdc8d8SChris Lattner m_index = UINT32_MAX; 25630fdc8d8SChris Lattner return fail_value; 25730fdc8d8SChris Lattner } 25830fdc8d8SChris Lattner 25930fdc8d8SChris Lattner uint8_t nibble_lo; 26030fdc8d8SChris Lattner uint8_t nibble_hi = xdigit_to_sint (m_packet[m_index]); 26130fdc8d8SChris Lattner ++m_index; 26230fdc8d8SChris Lattner if (m_index < m_packet.size() && ::isxdigit (m_packet[m_index])) 26330fdc8d8SChris Lattner { 26430fdc8d8SChris Lattner nibble_lo = xdigit_to_sint (m_packet[m_index]); 26530fdc8d8SChris Lattner ++m_index; 26630fdc8d8SChris Lattner result |= ((uint64_t)nibble_hi << (shift_amount + 4)); 26730fdc8d8SChris Lattner result |= ((uint64_t)nibble_lo << shift_amount); 26830fdc8d8SChris Lattner nibble_count += 2; 26930fdc8d8SChris Lattner shift_amount += 8; 27030fdc8d8SChris Lattner } 27130fdc8d8SChris Lattner else 27230fdc8d8SChris Lattner { 27330fdc8d8SChris Lattner result |= ((uint64_t)nibble_hi << shift_amount); 27430fdc8d8SChris Lattner nibble_count += 1; 27530fdc8d8SChris Lattner shift_amount += 4; 27630fdc8d8SChris Lattner } 27730fdc8d8SChris Lattner 27830fdc8d8SChris Lattner } 27930fdc8d8SChris Lattner } 28030fdc8d8SChris Lattner else 28130fdc8d8SChris Lattner { 28230fdc8d8SChris Lattner while (m_index < m_packet.size() && ::isxdigit (m_packet[m_index])) 28330fdc8d8SChris Lattner { 28430fdc8d8SChris Lattner // Make sure we don't exceed the size of a uint64_t... 
28530fdc8d8SChris Lattner if (nibble_count >= (sizeof(uint64_t) * 2)) 28630fdc8d8SChris Lattner { 28730fdc8d8SChris Lattner m_index = UINT32_MAX; 28830fdc8d8SChris Lattner return fail_value; 28930fdc8d8SChris Lattner } 29030fdc8d8SChris Lattner 29130fdc8d8SChris Lattner uint8_t nibble = xdigit_to_sint (m_packet[m_index]); 29230fdc8d8SChris Lattner // Big Endian 29330fdc8d8SChris Lattner result <<= 4; 29430fdc8d8SChris Lattner result |= nibble; 29530fdc8d8SChris Lattner 29630fdc8d8SChris Lattner ++m_index; 29730fdc8d8SChris Lattner ++nibble_count; 29830fdc8d8SChris Lattner } 29930fdc8d8SChris Lattner } 30030fdc8d8SChris Lattner return result; 30130fdc8d8SChris Lattner } 30230fdc8d8SChris Lattner 30330fdc8d8SChris Lattner size_t 30430fdc8d8SChris Lattner StringExtractor::GetHexBytes (void *dst_void, size_t dst_len, uint8_t fail_fill_value) 30530fdc8d8SChris Lattner { 30630fdc8d8SChris Lattner uint8_t *dst = (uint8_t*)dst_void; 30730fdc8d8SChris Lattner size_t bytes_extracted = 0; 30830fdc8d8SChris Lattner while (bytes_extracted < dst_len && GetBytesLeft ()) 30930fdc8d8SChris Lattner { 31030fdc8d8SChris Lattner dst[bytes_extracted] = GetHexU8 (fail_fill_value); 31130fdc8d8SChris Lattner if (IsGood()) 31230fdc8d8SChris Lattner ++bytes_extracted; 31330fdc8d8SChris Lattner else 31430fdc8d8SChris Lattner break; 31530fdc8d8SChris Lattner } 31630fdc8d8SChris Lattner 31730fdc8d8SChris Lattner for (size_t i = bytes_extracted; i < dst_len; ++i) 31830fdc8d8SChris Lattner dst[i] = fail_fill_value; 31930fdc8d8SChris Lattner 32030fdc8d8SChris Lattner return bytes_extracted; 32130fdc8d8SChris Lattner } 32230fdc8d8SChris Lattner 32330fdc8d8SChris Lattner 32430fdc8d8SChris Lattner // Consume ASCII hex nibble character pairs until we have decoded byte_size 32530fdc8d8SChris Lattner // bytes of data. 
32630fdc8d8SChris Lattner 32730fdc8d8SChris Lattner uint64_t 32830fdc8d8SChris Lattner StringExtractor::GetHexWithFixedSize (uint32_t byte_size, bool little_endian, uint64_t fail_value) 32930fdc8d8SChris Lattner { 33030fdc8d8SChris Lattner if (byte_size <= 8 && GetBytesLeft() >= byte_size * 2) 33130fdc8d8SChris Lattner { 33230fdc8d8SChris Lattner uint64_t result = 0; 33330fdc8d8SChris Lattner uint32_t i; 33430fdc8d8SChris Lattner if (little_endian) 33530fdc8d8SChris Lattner { 33630fdc8d8SChris Lattner // Little Endian 33730fdc8d8SChris Lattner uint32_t shift_amount; 33830fdc8d8SChris Lattner for (i = 0, shift_amount = 0; 33930fdc8d8SChris Lattner i < byte_size && m_index != UINT32_MAX; 34030fdc8d8SChris Lattner ++i, shift_amount += 8) 34130fdc8d8SChris Lattner { 34230fdc8d8SChris Lattner result |= ((uint64_t)GetHexU8() << shift_amount); 34330fdc8d8SChris Lattner } 34430fdc8d8SChris Lattner } 34530fdc8d8SChris Lattner else 34630fdc8d8SChris Lattner { 34730fdc8d8SChris Lattner // Big Endian 34830fdc8d8SChris Lattner for (i = 0; i < byte_size && m_index != UINT32_MAX; ++i) 34930fdc8d8SChris Lattner { 35030fdc8d8SChris Lattner result <<= 8; 35130fdc8d8SChris Lattner result |= GetHexU8(); 35230fdc8d8SChris Lattner } 35330fdc8d8SChris Lattner } 35430fdc8d8SChris Lattner } 35530fdc8d8SChris Lattner m_index = UINT32_MAX; 35630fdc8d8SChris Lattner return fail_value; 35730fdc8d8SChris Lattner } 35830fdc8d8SChris Lattner 359de9d0494SGreg Clayton size_t 360de9d0494SGreg Clayton StringExtractor::GetHexByteString (std::string &str) 361de9d0494SGreg Clayton { 362de9d0494SGreg Clayton str.clear(); 363de9d0494SGreg Clayton char ch; 364de9d0494SGreg Clayton while ((ch = GetHexU8()) != '\0') 365de9d0494SGreg Clayton str.append(1, ch); 366de9d0494SGreg Clayton return str.size(); 367de9d0494SGreg Clayton } 368de9d0494SGreg Clayton 36930fdc8d8SChris Lattner bool 37030fdc8d8SChris Lattner StringExtractor::GetNameColonValue (std::string &name, std::string &value) 37130fdc8d8SChris Lattner 
{ 37230fdc8d8SChris Lattner // Read something in the form of NNNN:VVVV; where NNNN is any character 37330fdc8d8SChris Lattner // that is not a colon, followed by a ':' character, then a value (one or 37430fdc8d8SChris Lattner // more ';' chars), followed by a ';' 37530fdc8d8SChris Lattner if (m_index < m_packet.size()) 37630fdc8d8SChris Lattner { 37730fdc8d8SChris Lattner const size_t colon_idx = m_packet.find (':', m_index); 37830fdc8d8SChris Lattner if (colon_idx != std::string::npos) 37930fdc8d8SChris Lattner { 38030fdc8d8SChris Lattner const size_t semicolon_idx = m_packet.find (';', colon_idx); 38130fdc8d8SChris Lattner if (semicolon_idx != std::string::npos) 38230fdc8d8SChris Lattner { 38330fdc8d8SChris Lattner name.assign (m_packet, m_index, colon_idx - m_index); 38430fdc8d8SChris Lattner value.assign (m_packet, colon_idx + 1, semicolon_idx - (colon_idx + 1)); 38530fdc8d8SChris Lattner m_index = semicolon_idx + 1; 38630fdc8d8SChris Lattner return true; 38730fdc8d8SChris Lattner } 38830fdc8d8SChris Lattner } 38930fdc8d8SChris Lattner } 39030fdc8d8SChris Lattner m_index = UINT32_MAX; 39130fdc8d8SChris Lattner return false; 39230fdc8d8SChris Lattner } 393