130fdc8d8SChris Lattner //===-- StringExtractor.cpp -------------------------------------*- C++ -*-===// 230fdc8d8SChris Lattner // 330fdc8d8SChris Lattner // The LLVM Compiler Infrastructure 430fdc8d8SChris Lattner // 530fdc8d8SChris Lattner // This file is distributed under the University of Illinois Open Source 630fdc8d8SChris Lattner // License. See LICENSE.TXT for details. 730fdc8d8SChris Lattner // 830fdc8d8SChris Lattner //===----------------------------------------------------------------------===// 930fdc8d8SChris Lattner 1030fdc8d8SChris Lattner #include "StringExtractor.h" 1130fdc8d8SChris Lattner 1230fdc8d8SChris Lattner // C Includes 1330fdc8d8SChris Lattner // C++ Includes 1430fdc8d8SChris Lattner // Other libraries and framework includes 1530fdc8d8SChris Lattner // Project includes 1630fdc8d8SChris Lattner 1730fdc8d8SChris Lattner static inline int 1830fdc8d8SChris Lattner xdigit_to_sint (char ch) 1930fdc8d8SChris Lattner { 2030fdc8d8SChris Lattner if (ch >= 'a' && ch <= 'f') 2130fdc8d8SChris Lattner return 10 + ch - 'a'; 22*1e89cd80SBenjamin Kramer if (ch >= 'A' && ch <= 'F') 23*1e89cd80SBenjamin Kramer return 10 + ch - 'A'; 2430fdc8d8SChris Lattner return ch - '0'; 2530fdc8d8SChris Lattner } 2630fdc8d8SChris Lattner 2730fdc8d8SChris Lattner static inline unsigned int 2830fdc8d8SChris Lattner xdigit_to_uint (uint8_t ch) 2930fdc8d8SChris Lattner { 3030fdc8d8SChris Lattner if (ch >= 'a' && ch <= 'f') 3130fdc8d8SChris Lattner return 10u + ch - 'a'; 32*1e89cd80SBenjamin Kramer if (ch >= 'A' && ch <= 'F') 33*1e89cd80SBenjamin Kramer return 10u + ch - 'A'; 3430fdc8d8SChris Lattner return ch - '0'; 3530fdc8d8SChris Lattner } 3630fdc8d8SChris Lattner 3730fdc8d8SChris Lattner //---------------------------------------------------------------------- 3830fdc8d8SChris Lattner // StringExtractor constructor 3930fdc8d8SChris Lattner //---------------------------------------------------------------------- 4030fdc8d8SChris Lattner StringExtractor::StringExtractor() : 4130fdc8d8SChris Lattner m_packet(), 4230fdc8d8SChris Lattner m_index (0) 4330fdc8d8SChris Lattner { 4430fdc8d8SChris Lattner } 4530fdc8d8SChris Lattner 4630fdc8d8SChris Lattner 4730fdc8d8SChris Lattner StringExtractor::StringExtractor(const char *packet_cstr) : 4830fdc8d8SChris Lattner m_packet(), 4930fdc8d8SChris Lattner m_index (0) 5030fdc8d8SChris Lattner { 5130fdc8d8SChris Lattner if (packet_cstr) 5230fdc8d8SChris Lattner m_packet.assign (packet_cstr); 5330fdc8d8SChris Lattner } 5430fdc8d8SChris Lattner 5530fdc8d8SChris Lattner 5630fdc8d8SChris Lattner //---------------------------------------------------------------------- 5730fdc8d8SChris Lattner // StringExtractor copy constructor 5830fdc8d8SChris Lattner //---------------------------------------------------------------------- 5930fdc8d8SChris Lattner StringExtractor::StringExtractor(const StringExtractor& rhs) : 6030fdc8d8SChris Lattner m_packet (rhs.m_packet), 6130fdc8d8SChris Lattner m_index (rhs.m_index) 6230fdc8d8SChris Lattner { 6330fdc8d8SChris Lattner 6430fdc8d8SChris Lattner } 6530fdc8d8SChris Lattner 6630fdc8d8SChris Lattner //---------------------------------------------------------------------- 6730fdc8d8SChris Lattner // StringExtractor assignment operator 6830fdc8d8SChris Lattner //---------------------------------------------------------------------- 6930fdc8d8SChris Lattner const StringExtractor& 7030fdc8d8SChris Lattner StringExtractor::operator=(const StringExtractor& rhs) 7130fdc8d8SChris Lattner { 7230fdc8d8SChris Lattner if (this != &rhs) 7330fdc8d8SChris Lattner { 7430fdc8d8SChris Lattner m_packet = rhs.m_packet; 7530fdc8d8SChris Lattner m_index = rhs.m_index; 7630fdc8d8SChris Lattner 7730fdc8d8SChris Lattner } 7830fdc8d8SChris Lattner return *this; 7930fdc8d8SChris Lattner } 8030fdc8d8SChris Lattner 8130fdc8d8SChris Lattner //---------------------------------------------------------------------- 8230fdc8d8SChris Lattner // Destructor 8330fdc8d8SChris Lattner //---------------------------------------------------------------------- 8430fdc8d8SChris Lattner StringExtractor::~StringExtractor() 8530fdc8d8SChris Lattner { 8630fdc8d8SChris Lattner } 8730fdc8d8SChris Lattner 8830fdc8d8SChris Lattner 8930fdc8d8SChris Lattner char 9030fdc8d8SChris Lattner StringExtractor::GetChar (char fail_value) 9130fdc8d8SChris Lattner { 9230fdc8d8SChris Lattner if (m_index < m_packet.size()) 9330fdc8d8SChris Lattner { 9430fdc8d8SChris Lattner char ch = m_packet[m_index]; 9530fdc8d8SChris Lattner ++m_index; 9630fdc8d8SChris Lattner return ch; 9730fdc8d8SChris Lattner } 9830fdc8d8SChris Lattner m_index = UINT32_MAX; 9930fdc8d8SChris Lattner return fail_value; 10030fdc8d8SChris Lattner } 10130fdc8d8SChris Lattner 10230fdc8d8SChris Lattner uint32_t 10330fdc8d8SChris Lattner StringExtractor::GetNumHexASCIICharsAtFilePos (uint32_t max) const 10430fdc8d8SChris Lattner { 10530fdc8d8SChris Lattner uint32_t idx = m_index; 10630fdc8d8SChris Lattner const size_t size = m_packet.size(); 10730fdc8d8SChris Lattner while (idx < size && idx - m_index < max && isxdigit(m_packet[idx])) 10830fdc8d8SChris Lattner ++idx; 10930fdc8d8SChris Lattner return idx - m_index; 11030fdc8d8SChris Lattner } 11130fdc8d8SChris Lattner //---------------------------------------------------------------------- 11230fdc8d8SChris Lattner // Extract a signed character from two hex ASCII chars in the packet 11330fdc8d8SChris Lattner // string 11430fdc8d8SChris Lattner //---------------------------------------------------------------------- 11530fdc8d8SChris Lattner int8_t 11630fdc8d8SChris Lattner StringExtractor::GetHexS8 (int8_t fail_value) 11730fdc8d8SChris Lattner { 11830fdc8d8SChris Lattner if (GetNumHexASCIICharsAtFilePos(2)) 11930fdc8d8SChris Lattner { 12030fdc8d8SChris Lattner char hi_nibble_char = m_packet[m_index]; 12130fdc8d8SChris Lattner char lo_nibble_char = m_packet[m_index+1]; 12230fdc8d8SChris Lattner 12330fdc8d8SChris Lattner if (isxdigit(hi_nibble_char) && isxdigit(lo_nibble_char)) 12430fdc8d8SChris Lattner { 12530fdc8d8SChris Lattner char hi_nibble = xdigit_to_sint (hi_nibble_char); 12630fdc8d8SChris Lattner char lo_nibble = xdigit_to_sint (lo_nibble_char); 12730fdc8d8SChris Lattner m_index += 2; 12830fdc8d8SChris Lattner return (hi_nibble << 4) + lo_nibble; 12930fdc8d8SChris Lattner } 13030fdc8d8SChris Lattner } 13130fdc8d8SChris Lattner m_index = UINT32_MAX; 13230fdc8d8SChris Lattner return fail_value; 13330fdc8d8SChris Lattner } 13430fdc8d8SChris Lattner 13530fdc8d8SChris Lattner //---------------------------------------------------------------------- 13630fdc8d8SChris Lattner // Extract an unsigned character from two hex ASCII chars in the packet 13730fdc8d8SChris Lattner // string 13830fdc8d8SChris Lattner //---------------------------------------------------------------------- 13930fdc8d8SChris Lattner uint8_t 14030fdc8d8SChris Lattner StringExtractor::GetHexU8 (uint8_t fail_value) 14130fdc8d8SChris Lattner { 14230fdc8d8SChris Lattner if (GetNumHexASCIICharsAtFilePos(2)) 14330fdc8d8SChris Lattner { 14430fdc8d8SChris Lattner uint8_t hi_nibble_char = m_packet[m_index]; 14530fdc8d8SChris Lattner uint8_t lo_nibble_char = m_packet[m_index+1]; 14630fdc8d8SChris Lattner 14730fdc8d8SChris Lattner if (isxdigit(hi_nibble_char) && isxdigit(lo_nibble_char)) 14830fdc8d8SChris Lattner { 14930fdc8d8SChris Lattner uint8_t hi_nibble = xdigit_to_sint (hi_nibble_char); 15030fdc8d8SChris Lattner uint8_t lo_nibble = xdigit_to_sint (lo_nibble_char); 15130fdc8d8SChris Lattner m_index += 2; 15230fdc8d8SChris Lattner return (hi_nibble << 4) + lo_nibble; 15330fdc8d8SChris Lattner } 15430fdc8d8SChris Lattner } 15530fdc8d8SChris Lattner m_index = UINT32_MAX; 15630fdc8d8SChris Lattner return fail_value; 15730fdc8d8SChris Lattner } 15830fdc8d8SChris Lattner 15930fdc8d8SChris Lattner uint32_t 16030fdc8d8SChris Lattner StringExtractor::GetHexMaxU32 (bool little_endian, uint32_t fail_value) 16130fdc8d8SChris Lattner { 16230fdc8d8SChris Lattner uint32_t result = 0; 16330fdc8d8SChris Lattner uint32_t nibble_count = 0; 16430fdc8d8SChris Lattner 16530fdc8d8SChris Lattner if (little_endian) 16630fdc8d8SChris Lattner { 16730fdc8d8SChris Lattner uint32_t shift_amount = 0; 16830fdc8d8SChris Lattner while (m_index < m_packet.size() && ::isxdigit (m_packet[m_index])) 16930fdc8d8SChris Lattner { 17030fdc8d8SChris Lattner // Make sure we don't exceed the size of a uint32_t... 17130fdc8d8SChris Lattner if (nibble_count >= (sizeof(uint32_t) * 2)) 17230fdc8d8SChris Lattner { 17330fdc8d8SChris Lattner m_index = UINT32_MAX; 17430fdc8d8SChris Lattner return fail_value; 17530fdc8d8SChris Lattner } 17630fdc8d8SChris Lattner 17730fdc8d8SChris Lattner uint8_t nibble_lo; 17830fdc8d8SChris Lattner uint8_t nibble_hi = xdigit_to_sint (m_packet[m_index]); 17930fdc8d8SChris Lattner ++m_index; 18030fdc8d8SChris Lattner if (m_index < m_packet.size() && ::isxdigit (m_packet[m_index])) 18130fdc8d8SChris Lattner { 18230fdc8d8SChris Lattner nibble_lo = xdigit_to_sint (m_packet[m_index]); 18330fdc8d8SChris Lattner ++m_index; 18430fdc8d8SChris Lattner result |= ((uint32_t)nibble_hi << (shift_amount + 4)); 18530fdc8d8SChris Lattner result |= ((uint32_t)nibble_lo << shift_amount); 18630fdc8d8SChris Lattner nibble_count += 2; 18730fdc8d8SChris Lattner shift_amount += 8; 18830fdc8d8SChris Lattner } 18930fdc8d8SChris Lattner else 19030fdc8d8SChris Lattner { 19130fdc8d8SChris Lattner result |= ((uint32_t)nibble_hi << shift_amount); 19230fdc8d8SChris Lattner nibble_count += 1; 19330fdc8d8SChris Lattner shift_amount += 4; 19430fdc8d8SChris Lattner } 19530fdc8d8SChris Lattner 19630fdc8d8SChris Lattner } 19730fdc8d8SChris Lattner } 19830fdc8d8SChris Lattner else 19930fdc8d8SChris Lattner { 20030fdc8d8SChris Lattner while (m_index < m_packet.size() && ::isxdigit (m_packet[m_index])) 20130fdc8d8SChris Lattner { 20230fdc8d8SChris Lattner // Make sure we don't exceed the size of a uint32_t... 20330fdc8d8SChris Lattner if (nibble_count >= (sizeof(uint32_t) * 2)) 20430fdc8d8SChris Lattner { 20530fdc8d8SChris Lattner m_index = UINT32_MAX; 20630fdc8d8SChris Lattner return fail_value; 20730fdc8d8SChris Lattner } 20830fdc8d8SChris Lattner 20930fdc8d8SChris Lattner uint8_t nibble = xdigit_to_sint (m_packet[m_index]); 21030fdc8d8SChris Lattner // Big Endian 21130fdc8d8SChris Lattner result <<= 4; 21230fdc8d8SChris Lattner result |= nibble; 21330fdc8d8SChris Lattner 21430fdc8d8SChris Lattner ++m_index; 21530fdc8d8SChris Lattner ++nibble_count; 21630fdc8d8SChris Lattner } 21730fdc8d8SChris Lattner } 21830fdc8d8SChris Lattner return result; 21930fdc8d8SChris Lattner } 22030fdc8d8SChris Lattner 22130fdc8d8SChris Lattner uint64_t 22230fdc8d8SChris Lattner StringExtractor::GetHexMaxU64 (bool little_endian, uint64_t fail_value) 22330fdc8d8SChris Lattner { 22430fdc8d8SChris Lattner uint64_t result = 0; 22530fdc8d8SChris Lattner uint32_t nibble_count = 0; 22630fdc8d8SChris Lattner 22730fdc8d8SChris Lattner if (little_endian) 22830fdc8d8SChris Lattner { 22930fdc8d8SChris Lattner uint32_t shift_amount = 0; 23030fdc8d8SChris Lattner while (m_index < m_packet.size() && ::isxdigit (m_packet[m_index])) 23130fdc8d8SChris Lattner { 23230fdc8d8SChris Lattner // Make sure we don't exceed the size of a uint64_t... 23330fdc8d8SChris Lattner if (nibble_count >= (sizeof(uint64_t) * 2)) 23430fdc8d8SChris Lattner { 23530fdc8d8SChris Lattner m_index = UINT32_MAX; 23630fdc8d8SChris Lattner return fail_value; 23730fdc8d8SChris Lattner } 23830fdc8d8SChris Lattner 23930fdc8d8SChris Lattner uint8_t nibble_lo; 24030fdc8d8SChris Lattner uint8_t nibble_hi = xdigit_to_sint (m_packet[m_index]); 24130fdc8d8SChris Lattner ++m_index; 24230fdc8d8SChris Lattner if (m_index < m_packet.size() && ::isxdigit (m_packet[m_index])) 24330fdc8d8SChris Lattner { 24430fdc8d8SChris Lattner nibble_lo = xdigit_to_sint (m_packet[m_index]); 24530fdc8d8SChris Lattner ++m_index; 24630fdc8d8SChris Lattner result |= ((uint64_t)nibble_hi << (shift_amount + 4)); 24730fdc8d8SChris Lattner result |= ((uint64_t)nibble_lo << shift_amount); 24830fdc8d8SChris Lattner nibble_count += 2; 24930fdc8d8SChris Lattner shift_amount += 8; 25030fdc8d8SChris Lattner } 25130fdc8d8SChris Lattner else 25230fdc8d8SChris Lattner { 25330fdc8d8SChris Lattner result |= ((uint64_t)nibble_hi << shift_amount); 25430fdc8d8SChris Lattner nibble_count += 1; 25530fdc8d8SChris Lattner shift_amount += 4; 25630fdc8d8SChris Lattner } 25730fdc8d8SChris Lattner 25830fdc8d8SChris Lattner } 25930fdc8d8SChris Lattner } 26030fdc8d8SChris Lattner else 26130fdc8d8SChris Lattner { 26230fdc8d8SChris Lattner while (m_index < m_packet.size() && ::isxdigit (m_packet[m_index])) 26330fdc8d8SChris Lattner { 26430fdc8d8SChris Lattner // Make sure we don't exceed the size of a uint64_t... 26530fdc8d8SChris Lattner if (nibble_count >= (sizeof(uint64_t) * 2)) 26630fdc8d8SChris Lattner { 26730fdc8d8SChris Lattner m_index = UINT32_MAX; 26830fdc8d8SChris Lattner return fail_value; 26930fdc8d8SChris Lattner } 27030fdc8d8SChris Lattner 27130fdc8d8SChris Lattner uint8_t nibble = xdigit_to_sint (m_packet[m_index]); 27230fdc8d8SChris Lattner // Big Endian 27330fdc8d8SChris Lattner result <<= 4; 27430fdc8d8SChris Lattner result |= nibble; 27530fdc8d8SChris Lattner 27630fdc8d8SChris Lattner ++m_index; 27730fdc8d8SChris Lattner ++nibble_count; 27830fdc8d8SChris Lattner } 27930fdc8d8SChris Lattner } 28030fdc8d8SChris Lattner return result; 28130fdc8d8SChris Lattner } 28230fdc8d8SChris Lattner 28330fdc8d8SChris Lattner size_t 28430fdc8d8SChris Lattner StringExtractor::GetHexBytes (void *dst_void, size_t dst_len, uint8_t fail_fill_value) 28530fdc8d8SChris Lattner { 28630fdc8d8SChris Lattner uint8_t *dst = (uint8_t*)dst_void; 28730fdc8d8SChris Lattner size_t bytes_extracted = 0; 28830fdc8d8SChris Lattner while (bytes_extracted < dst_len && GetBytesLeft ()) 28930fdc8d8SChris Lattner { 29030fdc8d8SChris Lattner dst[bytes_extracted] = GetHexU8 (fail_fill_value); 29130fdc8d8SChris Lattner if (IsGood()) 29230fdc8d8SChris Lattner ++bytes_extracted; 29330fdc8d8SChris Lattner else 29430fdc8d8SChris Lattner break; 29530fdc8d8SChris Lattner } 29630fdc8d8SChris Lattner 29730fdc8d8SChris Lattner for (size_t i = bytes_extracted; i < dst_len; ++i) 29830fdc8d8SChris Lattner dst[i] = fail_fill_value; 29930fdc8d8SChris Lattner 30030fdc8d8SChris Lattner return bytes_extracted; 30130fdc8d8SChris Lattner } 30230fdc8d8SChris Lattner 30330fdc8d8SChris Lattner 30430fdc8d8SChris Lattner // Consume ASCII hex nibble character pairs until we have decoded byte_size 30530fdc8d8SChris Lattner // bytes of data. 30630fdc8d8SChris Lattner 30730fdc8d8SChris Lattner uint64_t 30830fdc8d8SChris Lattner StringExtractor::GetHexWithFixedSize (uint32_t byte_size, bool little_endian, uint64_t fail_value) 30930fdc8d8SChris Lattner { 31030fdc8d8SChris Lattner if (byte_size <= 8 && GetBytesLeft() >= byte_size * 2) 31130fdc8d8SChris Lattner { 31230fdc8d8SChris Lattner uint64_t result = 0; 31330fdc8d8SChris Lattner uint32_t i; 31430fdc8d8SChris Lattner if (little_endian) 31530fdc8d8SChris Lattner { 31630fdc8d8SChris Lattner // Little Endian 31730fdc8d8SChris Lattner uint32_t shift_amount; 31830fdc8d8SChris Lattner for (i = 0, shift_amount = 0; 31930fdc8d8SChris Lattner i < byte_size && m_index != UINT32_MAX; 32030fdc8d8SChris Lattner ++i, shift_amount += 8) 32130fdc8d8SChris Lattner { 32230fdc8d8SChris Lattner result |= ((uint64_t)GetHexU8() << shift_amount); 32330fdc8d8SChris Lattner } 32430fdc8d8SChris Lattner } 32530fdc8d8SChris Lattner else 32630fdc8d8SChris Lattner { 32730fdc8d8SChris Lattner // Big Endian 32830fdc8d8SChris Lattner for (i = 0; i < byte_size && m_index != UINT32_MAX; ++i) 32930fdc8d8SChris Lattner { 33030fdc8d8SChris Lattner result <<= 8; 33130fdc8d8SChris Lattner result |= GetHexU8(); 33230fdc8d8SChris Lattner } 33330fdc8d8SChris Lattner } 33430fdc8d8SChris Lattner } 33530fdc8d8SChris Lattner m_index = UINT32_MAX; 33630fdc8d8SChris Lattner return fail_value; 33730fdc8d8SChris Lattner } 33830fdc8d8SChris Lattner 33930fdc8d8SChris Lattner bool 34030fdc8d8SChris Lattner StringExtractor::GetNameColonValue (std::string &name, std::string &value) 34130fdc8d8SChris Lattner { 34230fdc8d8SChris Lattner // Read something in the form of NNNN:VVVV; where NNNN is any character 34330fdc8d8SChris Lattner // that is not a colon, followed by a ':' character, then a value (one or 34430fdc8d8SChris Lattner // more ';' chars), followed by a ';' 34530fdc8d8SChris Lattner if (m_index < m_packet.size()) 34630fdc8d8SChris Lattner { 34730fdc8d8SChris Lattner const size_t colon_idx = m_packet.find (':', m_index); 34830fdc8d8SChris Lattner if (colon_idx != std::string::npos) 34930fdc8d8SChris Lattner { 35030fdc8d8SChris Lattner const size_t semicolon_idx = m_packet.find (';', colon_idx); 35130fdc8d8SChris Lattner if (semicolon_idx != std::string::npos) 35230fdc8d8SChris Lattner { 35330fdc8d8SChris Lattner name.assign (m_packet, m_index, colon_idx - m_index); 35430fdc8d8SChris Lattner value.assign (m_packet, colon_idx + 1, semicolon_idx - (colon_idx + 1)); 35530fdc8d8SChris Lattner m_index = semicolon_idx + 1; 35630fdc8d8SChris Lattner return true; 35730fdc8d8SChris Lattner } 35830fdc8d8SChris Lattner } 35930fdc8d8SChris Lattner } 36030fdc8d8SChris Lattner m_index = UINT32_MAX; 36130fdc8d8SChris Lattner return false; 36230fdc8d8SChris Lattner } 363