130fdc8d8SChris Lattner //===-- StringExtractor.cpp -------------------------------------*- C++ -*-===//
230fdc8d8SChris Lattner //
330fdc8d8SChris Lattner //                     The LLVM Compiler Infrastructure
430fdc8d8SChris Lattner //
530fdc8d8SChris Lattner // This file is distributed under the University of Illinois Open Source
630fdc8d8SChris Lattner // License. See LICENSE.TXT for details.
730fdc8d8SChris Lattner //
830fdc8d8SChris Lattner //===----------------------------------------------------------------------===//
930fdc8d8SChris Lattner 
10c982c768SGreg Clayton #include "Utility/StringExtractor.h"
1130fdc8d8SChris Lattner 
1230fdc8d8SChris Lattner // C Includes
1378709173SStephen Wilson #include <stdlib.h>
1478709173SStephen Wilson 
1530fdc8d8SChris Lattner // C++ Includes
1630fdc8d8SChris Lattner // Other libraries and framework includes
1730fdc8d8SChris Lattner // Project includes
1830fdc8d8SChris Lattner 
1930fdc8d8SChris Lattner static inline int
2030fdc8d8SChris Lattner xdigit_to_sint (char ch)
2130fdc8d8SChris Lattner {
2230fdc8d8SChris Lattner     if (ch >= 'a' && ch <= 'f')
2330fdc8d8SChris Lattner         return 10 + ch - 'a';
241e89cd80SBenjamin Kramer     if (ch >= 'A' && ch <= 'F')
251e89cd80SBenjamin Kramer         return 10 + ch - 'A';
2630fdc8d8SChris Lattner     return ch - '0';
2730fdc8d8SChris Lattner }
2830fdc8d8SChris Lattner 
2930fdc8d8SChris Lattner static inline unsigned int
3030fdc8d8SChris Lattner xdigit_to_uint (uint8_t ch)
3130fdc8d8SChris Lattner {
3230fdc8d8SChris Lattner     if (ch >= 'a' && ch <= 'f')
3330fdc8d8SChris Lattner         return 10u + ch - 'a';
341e89cd80SBenjamin Kramer     if (ch >= 'A' && ch <= 'F')
351e89cd80SBenjamin Kramer         return 10u + ch - 'A';
3630fdc8d8SChris Lattner     return ch - '0';
3730fdc8d8SChris Lattner }
3830fdc8d8SChris Lattner 
3930fdc8d8SChris Lattner //----------------------------------------------------------------------
4030fdc8d8SChris Lattner // StringExtractor constructor
4130fdc8d8SChris Lattner //----------------------------------------------------------------------
4230fdc8d8SChris Lattner StringExtractor::StringExtractor() :
4330fdc8d8SChris Lattner     m_packet(),
4430fdc8d8SChris Lattner     m_index (0)
4530fdc8d8SChris Lattner {
4630fdc8d8SChris Lattner }
4730fdc8d8SChris Lattner 
4830fdc8d8SChris Lattner 
4930fdc8d8SChris Lattner StringExtractor::StringExtractor(const char *packet_cstr) :
5030fdc8d8SChris Lattner     m_packet(),
5130fdc8d8SChris Lattner     m_index (0)
5230fdc8d8SChris Lattner {
5330fdc8d8SChris Lattner     if (packet_cstr)
5430fdc8d8SChris Lattner         m_packet.assign (packet_cstr);
5530fdc8d8SChris Lattner }
5630fdc8d8SChris Lattner 
5730fdc8d8SChris Lattner 
5830fdc8d8SChris Lattner //----------------------------------------------------------------------
5930fdc8d8SChris Lattner // StringExtractor copy constructor
6030fdc8d8SChris Lattner //----------------------------------------------------------------------
6130fdc8d8SChris Lattner StringExtractor::StringExtractor(const StringExtractor& rhs) :
6230fdc8d8SChris Lattner     m_packet (rhs.m_packet),
6330fdc8d8SChris Lattner     m_index (rhs.m_index)
6430fdc8d8SChris Lattner {
6530fdc8d8SChris Lattner 
6630fdc8d8SChris Lattner }
6730fdc8d8SChris Lattner 
6830fdc8d8SChris Lattner //----------------------------------------------------------------------
6930fdc8d8SChris Lattner // StringExtractor assignment operator
7030fdc8d8SChris Lattner //----------------------------------------------------------------------
7130fdc8d8SChris Lattner const StringExtractor&
7230fdc8d8SChris Lattner StringExtractor::operator=(const StringExtractor& rhs)
7330fdc8d8SChris Lattner {
7430fdc8d8SChris Lattner     if (this != &rhs)
7530fdc8d8SChris Lattner     {
7630fdc8d8SChris Lattner         m_packet = rhs.m_packet;
7730fdc8d8SChris Lattner         m_index = rhs.m_index;
7830fdc8d8SChris Lattner 
7930fdc8d8SChris Lattner     }
8030fdc8d8SChris Lattner     return *this;
8130fdc8d8SChris Lattner }
8230fdc8d8SChris Lattner 
8330fdc8d8SChris Lattner //----------------------------------------------------------------------
8430fdc8d8SChris Lattner // Destructor
8530fdc8d8SChris Lattner //----------------------------------------------------------------------
8630fdc8d8SChris Lattner StringExtractor::~StringExtractor()
8730fdc8d8SChris Lattner {
8830fdc8d8SChris Lattner }
8930fdc8d8SChris Lattner 
9030fdc8d8SChris Lattner 
9130fdc8d8SChris Lattner char
9230fdc8d8SChris Lattner StringExtractor::GetChar (char fail_value)
9330fdc8d8SChris Lattner {
9430fdc8d8SChris Lattner     if (m_index < m_packet.size())
9530fdc8d8SChris Lattner     {
9630fdc8d8SChris Lattner         char ch = m_packet[m_index];
9730fdc8d8SChris Lattner         ++m_index;
9830fdc8d8SChris Lattner         return ch;
9930fdc8d8SChris Lattner     }
10030fdc8d8SChris Lattner     m_index = UINT32_MAX;
10130fdc8d8SChris Lattner     return fail_value;
10230fdc8d8SChris Lattner }
10330fdc8d8SChris Lattner 
10430fdc8d8SChris Lattner uint32_t
10530fdc8d8SChris Lattner StringExtractor::GetNumHexASCIICharsAtFilePos (uint32_t max) const
10630fdc8d8SChris Lattner {
10730fdc8d8SChris Lattner     uint32_t idx = m_index;
10830fdc8d8SChris Lattner     const size_t size = m_packet.size();
10930fdc8d8SChris Lattner     while (idx < size && idx - m_index < max && isxdigit(m_packet[idx]))
11030fdc8d8SChris Lattner         ++idx;
11130fdc8d8SChris Lattner     return idx - m_index;
11230fdc8d8SChris Lattner }
11330fdc8d8SChris Lattner //----------------------------------------------------------------------
11430fdc8d8SChris Lattner // Extract a signed character from two hex ASCII chars in the packet
11530fdc8d8SChris Lattner // string
11630fdc8d8SChris Lattner //----------------------------------------------------------------------
11730fdc8d8SChris Lattner int8_t
11830fdc8d8SChris Lattner StringExtractor::GetHexS8 (int8_t fail_value)
11930fdc8d8SChris Lattner {
12030fdc8d8SChris Lattner     if (GetNumHexASCIICharsAtFilePos(2))
12130fdc8d8SChris Lattner     {
12230fdc8d8SChris Lattner         char hi_nibble_char = m_packet[m_index];
12330fdc8d8SChris Lattner         char lo_nibble_char = m_packet[m_index+1];
12430fdc8d8SChris Lattner         char hi_nibble = xdigit_to_sint (hi_nibble_char);
12530fdc8d8SChris Lattner         char lo_nibble = xdigit_to_sint (lo_nibble_char);
12630fdc8d8SChris Lattner         m_index += 2;
12730fdc8d8SChris Lattner         return (hi_nibble << 4) + lo_nibble;
12830fdc8d8SChris Lattner     }
12930fdc8d8SChris Lattner     m_index = UINT32_MAX;
13030fdc8d8SChris Lattner     return fail_value;
13130fdc8d8SChris Lattner }
13230fdc8d8SChris Lattner 
13330fdc8d8SChris Lattner //----------------------------------------------------------------------
13430fdc8d8SChris Lattner // Extract an unsigned character from two hex ASCII chars in the packet
13530fdc8d8SChris Lattner // string
13630fdc8d8SChris Lattner //----------------------------------------------------------------------
13730fdc8d8SChris Lattner uint8_t
138*7b70be39SGreg Clayton StringExtractor::GetHexU8 (uint8_t fail_value, bool set_eof_on_fail)
13930fdc8d8SChris Lattner {
14030fdc8d8SChris Lattner     if (GetNumHexASCIICharsAtFilePos(2))
14130fdc8d8SChris Lattner     {
14230fdc8d8SChris Lattner         uint8_t hi_nibble_char = m_packet[m_index];
14330fdc8d8SChris Lattner         uint8_t lo_nibble_char = m_packet[m_index+1];
14471337622SGreg Clayton         uint8_t hi_nibble = xdigit_to_uint (hi_nibble_char);
14571337622SGreg Clayton         uint8_t lo_nibble = xdigit_to_uint (lo_nibble_char);
14630fdc8d8SChris Lattner         m_index += 2;
14730fdc8d8SChris Lattner         return (hi_nibble << 4) + lo_nibble;
14830fdc8d8SChris Lattner     }
149*7b70be39SGreg Clayton     if (set_eof_on_fail || m_index >= m_packet.size())
15030fdc8d8SChris Lattner         m_index = UINT32_MAX;
15130fdc8d8SChris Lattner     return fail_value;
15230fdc8d8SChris Lattner }
15330fdc8d8SChris Lattner 
15430fdc8d8SChris Lattner uint32_t
15532e0a750SGreg Clayton StringExtractor::GetU32 (uint32_t fail_value, int base)
15632e0a750SGreg Clayton {
15732e0a750SGreg Clayton     if (m_index < m_packet.size())
15832e0a750SGreg Clayton     {
15932e0a750SGreg Clayton         char *end = NULL;
16032e0a750SGreg Clayton         const char *start = m_packet.c_str();
16132e0a750SGreg Clayton         const char *uint_cstr = start + m_index;
16232e0a750SGreg Clayton         uint32_t result = ::strtoul (uint_cstr, &end, base);
16332e0a750SGreg Clayton 
16432e0a750SGreg Clayton         if (end && end != uint_cstr)
16532e0a750SGreg Clayton         {
16632e0a750SGreg Clayton             m_index = end - start;
16732e0a750SGreg Clayton             return result;
16832e0a750SGreg Clayton         }
16932e0a750SGreg Clayton     }
17032e0a750SGreg Clayton     return fail_value;
17132e0a750SGreg Clayton }
17232e0a750SGreg Clayton 
17332e0a750SGreg Clayton 
17432e0a750SGreg Clayton uint32_t
17530fdc8d8SChris Lattner StringExtractor::GetHexMaxU32 (bool little_endian, uint32_t fail_value)
17630fdc8d8SChris Lattner {
17730fdc8d8SChris Lattner     uint32_t result = 0;
17830fdc8d8SChris Lattner     uint32_t nibble_count = 0;
17930fdc8d8SChris Lattner 
18030fdc8d8SChris Lattner     if (little_endian)
18130fdc8d8SChris Lattner     {
18230fdc8d8SChris Lattner         uint32_t shift_amount = 0;
18330fdc8d8SChris Lattner         while (m_index < m_packet.size() && ::isxdigit (m_packet[m_index]))
18430fdc8d8SChris Lattner         {
18530fdc8d8SChris Lattner             // Make sure we don't exceed the size of a uint32_t...
18630fdc8d8SChris Lattner             if (nibble_count >= (sizeof(uint32_t) * 2))
18730fdc8d8SChris Lattner             {
18830fdc8d8SChris Lattner                 m_index = UINT32_MAX;
18930fdc8d8SChris Lattner                 return fail_value;
19030fdc8d8SChris Lattner             }
19130fdc8d8SChris Lattner 
19230fdc8d8SChris Lattner             uint8_t nibble_lo;
19330fdc8d8SChris Lattner             uint8_t nibble_hi = xdigit_to_sint (m_packet[m_index]);
19430fdc8d8SChris Lattner             ++m_index;
19530fdc8d8SChris Lattner             if (m_index < m_packet.size() && ::isxdigit (m_packet[m_index]))
19630fdc8d8SChris Lattner             {
19730fdc8d8SChris Lattner                 nibble_lo = xdigit_to_sint (m_packet[m_index]);
19830fdc8d8SChris Lattner                 ++m_index;
19930fdc8d8SChris Lattner                 result |= ((uint32_t)nibble_hi << (shift_amount + 4));
20030fdc8d8SChris Lattner                 result |= ((uint32_t)nibble_lo << shift_amount);
20130fdc8d8SChris Lattner                 nibble_count += 2;
20230fdc8d8SChris Lattner                 shift_amount += 8;
20330fdc8d8SChris Lattner             }
20430fdc8d8SChris Lattner             else
20530fdc8d8SChris Lattner             {
20630fdc8d8SChris Lattner                 result |= ((uint32_t)nibble_hi << shift_amount);
20730fdc8d8SChris Lattner                 nibble_count += 1;
20830fdc8d8SChris Lattner                 shift_amount += 4;
20930fdc8d8SChris Lattner             }
21030fdc8d8SChris Lattner 
21130fdc8d8SChris Lattner         }
21230fdc8d8SChris Lattner     }
21330fdc8d8SChris Lattner     else
21430fdc8d8SChris Lattner     {
21530fdc8d8SChris Lattner         while (m_index < m_packet.size() && ::isxdigit (m_packet[m_index]))
21630fdc8d8SChris Lattner         {
21730fdc8d8SChris Lattner             // Make sure we don't exceed the size of a uint32_t...
21830fdc8d8SChris Lattner             if (nibble_count >= (sizeof(uint32_t) * 2))
21930fdc8d8SChris Lattner             {
22030fdc8d8SChris Lattner                 m_index = UINT32_MAX;
22130fdc8d8SChris Lattner                 return fail_value;
22230fdc8d8SChris Lattner             }
22330fdc8d8SChris Lattner 
22430fdc8d8SChris Lattner             uint8_t nibble = xdigit_to_sint (m_packet[m_index]);
22530fdc8d8SChris Lattner             // Big Endian
22630fdc8d8SChris Lattner             result <<= 4;
22730fdc8d8SChris Lattner             result |= nibble;
22830fdc8d8SChris Lattner 
22930fdc8d8SChris Lattner             ++m_index;
23030fdc8d8SChris Lattner             ++nibble_count;
23130fdc8d8SChris Lattner         }
23230fdc8d8SChris Lattner     }
23330fdc8d8SChris Lattner     return result;
23430fdc8d8SChris Lattner }
23530fdc8d8SChris Lattner 
23630fdc8d8SChris Lattner uint64_t
23730fdc8d8SChris Lattner StringExtractor::GetHexMaxU64 (bool little_endian, uint64_t fail_value)
23830fdc8d8SChris Lattner {
23930fdc8d8SChris Lattner     uint64_t result = 0;
24030fdc8d8SChris Lattner     uint32_t nibble_count = 0;
24130fdc8d8SChris Lattner 
24230fdc8d8SChris Lattner     if (little_endian)
24330fdc8d8SChris Lattner     {
24430fdc8d8SChris Lattner         uint32_t shift_amount = 0;
24530fdc8d8SChris Lattner         while (m_index < m_packet.size() && ::isxdigit (m_packet[m_index]))
24630fdc8d8SChris Lattner         {
24730fdc8d8SChris Lattner             // Make sure we don't exceed the size of a uint64_t...
24830fdc8d8SChris Lattner             if (nibble_count >= (sizeof(uint64_t) * 2))
24930fdc8d8SChris Lattner             {
25030fdc8d8SChris Lattner                 m_index = UINT32_MAX;
25130fdc8d8SChris Lattner                 return fail_value;
25230fdc8d8SChris Lattner             }
25330fdc8d8SChris Lattner 
25430fdc8d8SChris Lattner             uint8_t nibble_lo;
25530fdc8d8SChris Lattner             uint8_t nibble_hi = xdigit_to_sint (m_packet[m_index]);
25630fdc8d8SChris Lattner             ++m_index;
25730fdc8d8SChris Lattner             if (m_index < m_packet.size() && ::isxdigit (m_packet[m_index]))
25830fdc8d8SChris Lattner             {
25930fdc8d8SChris Lattner                 nibble_lo = xdigit_to_sint (m_packet[m_index]);
26030fdc8d8SChris Lattner                 ++m_index;
26130fdc8d8SChris Lattner                 result |= ((uint64_t)nibble_hi << (shift_amount + 4));
26230fdc8d8SChris Lattner                 result |= ((uint64_t)nibble_lo << shift_amount);
26330fdc8d8SChris Lattner                 nibble_count += 2;
26430fdc8d8SChris Lattner                 shift_amount += 8;
26530fdc8d8SChris Lattner             }
26630fdc8d8SChris Lattner             else
26730fdc8d8SChris Lattner             {
26830fdc8d8SChris Lattner                 result |= ((uint64_t)nibble_hi << shift_amount);
26930fdc8d8SChris Lattner                 nibble_count += 1;
27030fdc8d8SChris Lattner                 shift_amount += 4;
27130fdc8d8SChris Lattner             }
27230fdc8d8SChris Lattner 
27330fdc8d8SChris Lattner         }
27430fdc8d8SChris Lattner     }
27530fdc8d8SChris Lattner     else
27630fdc8d8SChris Lattner     {
27730fdc8d8SChris Lattner         while (m_index < m_packet.size() && ::isxdigit (m_packet[m_index]))
27830fdc8d8SChris Lattner         {
27930fdc8d8SChris Lattner             // Make sure we don't exceed the size of a uint64_t...
28030fdc8d8SChris Lattner             if (nibble_count >= (sizeof(uint64_t) * 2))
28130fdc8d8SChris Lattner             {
28230fdc8d8SChris Lattner                 m_index = UINT32_MAX;
28330fdc8d8SChris Lattner                 return fail_value;
28430fdc8d8SChris Lattner             }
28530fdc8d8SChris Lattner 
28630fdc8d8SChris Lattner             uint8_t nibble = xdigit_to_sint (m_packet[m_index]);
28730fdc8d8SChris Lattner             // Big Endian
28830fdc8d8SChris Lattner             result <<= 4;
28930fdc8d8SChris Lattner             result |= nibble;
29030fdc8d8SChris Lattner 
29130fdc8d8SChris Lattner             ++m_index;
29230fdc8d8SChris Lattner             ++nibble_count;
29330fdc8d8SChris Lattner         }
29430fdc8d8SChris Lattner     }
29530fdc8d8SChris Lattner     return result;
29630fdc8d8SChris Lattner }
29730fdc8d8SChris Lattner 
29830fdc8d8SChris Lattner size_t
29930fdc8d8SChris Lattner StringExtractor::GetHexBytes (void *dst_void, size_t dst_len, uint8_t fail_fill_value)
30030fdc8d8SChris Lattner {
30130fdc8d8SChris Lattner     uint8_t *dst = (uint8_t*)dst_void;
30230fdc8d8SChris Lattner     size_t bytes_extracted = 0;
30330fdc8d8SChris Lattner     while (bytes_extracted < dst_len && GetBytesLeft ())
30430fdc8d8SChris Lattner     {
30530fdc8d8SChris Lattner         dst[bytes_extracted] = GetHexU8 (fail_fill_value);
30630fdc8d8SChris Lattner         if (IsGood())
30730fdc8d8SChris Lattner             ++bytes_extracted;
30830fdc8d8SChris Lattner         else
30930fdc8d8SChris Lattner             break;
31030fdc8d8SChris Lattner     }
31130fdc8d8SChris Lattner 
31230fdc8d8SChris Lattner     for (size_t i = bytes_extracted; i < dst_len; ++i)
31330fdc8d8SChris Lattner         dst[i] = fail_fill_value;
31430fdc8d8SChris Lattner 
31530fdc8d8SChris Lattner     return bytes_extracted;
31630fdc8d8SChris Lattner }
31730fdc8d8SChris Lattner 
31830fdc8d8SChris Lattner 
31930fdc8d8SChris Lattner // Consume ASCII hex nibble character pairs until we have decoded byte_size
32030fdc8d8SChris Lattner // bytes of data.
32130fdc8d8SChris Lattner 
32230fdc8d8SChris Lattner uint64_t
32330fdc8d8SChris Lattner StringExtractor::GetHexWithFixedSize (uint32_t byte_size, bool little_endian, uint64_t fail_value)
32430fdc8d8SChris Lattner {
32530fdc8d8SChris Lattner     if (byte_size <= 8 && GetBytesLeft() >= byte_size * 2)
32630fdc8d8SChris Lattner     {
32730fdc8d8SChris Lattner         uint64_t result = 0;
32830fdc8d8SChris Lattner         uint32_t i;
32930fdc8d8SChris Lattner         if (little_endian)
33030fdc8d8SChris Lattner         {
33130fdc8d8SChris Lattner             // Little Endian
33230fdc8d8SChris Lattner             uint32_t shift_amount;
33330fdc8d8SChris Lattner             for (i = 0, shift_amount = 0;
33430fdc8d8SChris Lattner                  i < byte_size && m_index != UINT32_MAX;
33530fdc8d8SChris Lattner                  ++i, shift_amount += 8)
33630fdc8d8SChris Lattner             {
33730fdc8d8SChris Lattner                 result |= ((uint64_t)GetHexU8() << shift_amount);
33830fdc8d8SChris Lattner             }
33930fdc8d8SChris Lattner         }
34030fdc8d8SChris Lattner         else
34130fdc8d8SChris Lattner         {
34230fdc8d8SChris Lattner             // Big Endian
34330fdc8d8SChris Lattner             for (i = 0; i < byte_size && m_index != UINT32_MAX; ++i)
34430fdc8d8SChris Lattner             {
34530fdc8d8SChris Lattner                 result <<= 8;
34630fdc8d8SChris Lattner                 result |= GetHexU8();
34730fdc8d8SChris Lattner             }
34830fdc8d8SChris Lattner         }
34930fdc8d8SChris Lattner     }
35030fdc8d8SChris Lattner     m_index = UINT32_MAX;
35130fdc8d8SChris Lattner     return fail_value;
35230fdc8d8SChris Lattner }
35330fdc8d8SChris Lattner 
354de9d0494SGreg Clayton size_t
355de9d0494SGreg Clayton StringExtractor::GetHexByteString (std::string &str)
356de9d0494SGreg Clayton {
357de9d0494SGreg Clayton     str.clear();
358de9d0494SGreg Clayton     char ch;
359de9d0494SGreg Clayton     while ((ch = GetHexU8()) != '\0')
360de9d0494SGreg Clayton         str.append(1, ch);
361de9d0494SGreg Clayton     return str.size();
362de9d0494SGreg Clayton }
363de9d0494SGreg Clayton 
36430fdc8d8SChris Lattner bool
36530fdc8d8SChris Lattner StringExtractor::GetNameColonValue (std::string &name, std::string &value)
36630fdc8d8SChris Lattner {
36730fdc8d8SChris Lattner     // Read something in the form of NNNN:VVVV; where NNNN is any character
36830fdc8d8SChris Lattner     // that is not a colon, followed by a ':' character, then a value (one or
36930fdc8d8SChris Lattner     // more ';' chars), followed by a ';'
37030fdc8d8SChris Lattner     if (m_index < m_packet.size())
37130fdc8d8SChris Lattner     {
37230fdc8d8SChris Lattner         const size_t colon_idx = m_packet.find (':', m_index);
37330fdc8d8SChris Lattner         if (colon_idx != std::string::npos)
37430fdc8d8SChris Lattner         {
37530fdc8d8SChris Lattner             const size_t semicolon_idx = m_packet.find (';', colon_idx);
37630fdc8d8SChris Lattner             if (semicolon_idx != std::string::npos)
37730fdc8d8SChris Lattner             {
37830fdc8d8SChris Lattner                 name.assign (m_packet, m_index, colon_idx - m_index);
37930fdc8d8SChris Lattner                 value.assign (m_packet, colon_idx + 1, semicolon_idx - (colon_idx + 1));
38030fdc8d8SChris Lattner                 m_index = semicolon_idx + 1;
38130fdc8d8SChris Lattner                 return true;
38230fdc8d8SChris Lattner             }
38330fdc8d8SChris Lattner         }
38430fdc8d8SChris Lattner     }
38530fdc8d8SChris Lattner     m_index = UINT32_MAX;
38630fdc8d8SChris Lattner     return false;
38730fdc8d8SChris Lattner }
388