//===-- StringExtractor.cpp -------------------------------------*- C++ -*-===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
930fdc8d8SChris Lattner 
1030fdc8d8SChris Lattner #include "StringExtractor.h"
1130fdc8d8SChris Lattner 
1230fdc8d8SChris Lattner // C Includes
1330fdc8d8SChris Lattner // C++ Includes
1430fdc8d8SChris Lattner // Other libraries and framework includes
1530fdc8d8SChris Lattner // Project includes
1630fdc8d8SChris Lattner 
// Map a single ASCII hex digit to its numeric value, returned as a signed
// int. No validation is performed here: any character outside 'a'-'f' and
// 'A'-'F' is treated as a decimal digit and yields (ch - '0'), so callers
// are expected to have checked the character first.
static inline int
xdigit_to_sint (char ch)
{
    const bool is_lower_hex = ('a' <= ch && ch <= 'f');
    if (is_lower_hex)
        return (ch - 'a') + 10;

    const bool is_upper_hex = ('A' <= ch && ch <= 'F');
    if (is_upper_hex)
        return (ch - 'A') + 10;

    return ch - '0';
}
2630fdc8d8SChris Lattner 
// Unsigned counterpart of xdigit_to_sint: map a single ASCII hex digit to
// its numeric value as an unsigned int. No validation is performed; any
// byte outside 'a'-'f' and 'A'-'F' is treated as a decimal digit and yields
// (ch - '0') converted to unsigned.
static inline unsigned int
xdigit_to_uint (uint8_t ch)
{
    const bool is_lower_hex = ('a' <= ch && ch <= 'f');
    if (is_lower_hex)
        return 10u + ch - 'a';

    const bool is_upper_hex = ('A' <= ch && ch <= 'F');
    if (is_upper_hex)
        return 10u + ch - 'A';

    return ch - '0';
}
3630fdc8d8SChris Lattner 
3730fdc8d8SChris Lattner //----------------------------------------------------------------------
3830fdc8d8SChris Lattner // StringExtractor constructor
3930fdc8d8SChris Lattner //----------------------------------------------------------------------
4030fdc8d8SChris Lattner StringExtractor::StringExtractor() :
4130fdc8d8SChris Lattner     m_packet(),
4230fdc8d8SChris Lattner     m_index (0)
4330fdc8d8SChris Lattner {
4430fdc8d8SChris Lattner }
4530fdc8d8SChris Lattner 
4630fdc8d8SChris Lattner 
4730fdc8d8SChris Lattner StringExtractor::StringExtractor(const char *packet_cstr) :
4830fdc8d8SChris Lattner     m_packet(),
4930fdc8d8SChris Lattner     m_index (0)
5030fdc8d8SChris Lattner {
5130fdc8d8SChris Lattner     if (packet_cstr)
5230fdc8d8SChris Lattner         m_packet.assign (packet_cstr);
5330fdc8d8SChris Lattner }
5430fdc8d8SChris Lattner 
5530fdc8d8SChris Lattner 
5630fdc8d8SChris Lattner //----------------------------------------------------------------------
5730fdc8d8SChris Lattner // StringExtractor copy constructor
5830fdc8d8SChris Lattner //----------------------------------------------------------------------
5930fdc8d8SChris Lattner StringExtractor::StringExtractor(const StringExtractor& rhs) :
6030fdc8d8SChris Lattner     m_packet (rhs.m_packet),
6130fdc8d8SChris Lattner     m_index (rhs.m_index)
6230fdc8d8SChris Lattner {
6330fdc8d8SChris Lattner 
6430fdc8d8SChris Lattner }
6530fdc8d8SChris Lattner 
6630fdc8d8SChris Lattner //----------------------------------------------------------------------
6730fdc8d8SChris Lattner // StringExtractor assignment operator
6830fdc8d8SChris Lattner //----------------------------------------------------------------------
6930fdc8d8SChris Lattner const StringExtractor&
7030fdc8d8SChris Lattner StringExtractor::operator=(const StringExtractor& rhs)
7130fdc8d8SChris Lattner {
7230fdc8d8SChris Lattner     if (this != &rhs)
7330fdc8d8SChris Lattner     {
7430fdc8d8SChris Lattner         m_packet = rhs.m_packet;
7530fdc8d8SChris Lattner         m_index = rhs.m_index;
7630fdc8d8SChris Lattner 
7730fdc8d8SChris Lattner     }
7830fdc8d8SChris Lattner     return *this;
7930fdc8d8SChris Lattner }
8030fdc8d8SChris Lattner 
8130fdc8d8SChris Lattner //----------------------------------------------------------------------
8230fdc8d8SChris Lattner // Destructor
8330fdc8d8SChris Lattner //----------------------------------------------------------------------
8430fdc8d8SChris Lattner StringExtractor::~StringExtractor()
8530fdc8d8SChris Lattner {
8630fdc8d8SChris Lattner }
8730fdc8d8SChris Lattner 
8830fdc8d8SChris Lattner 
8930fdc8d8SChris Lattner char
9030fdc8d8SChris Lattner StringExtractor::GetChar (char fail_value)
9130fdc8d8SChris Lattner {
9230fdc8d8SChris Lattner     if (m_index < m_packet.size())
9330fdc8d8SChris Lattner     {
9430fdc8d8SChris Lattner         char ch = m_packet[m_index];
9530fdc8d8SChris Lattner         ++m_index;
9630fdc8d8SChris Lattner         return ch;
9730fdc8d8SChris Lattner     }
9830fdc8d8SChris Lattner     m_index = UINT32_MAX;
9930fdc8d8SChris Lattner     return fail_value;
10030fdc8d8SChris Lattner }
10130fdc8d8SChris Lattner 
10230fdc8d8SChris Lattner uint32_t
10330fdc8d8SChris Lattner StringExtractor::GetNumHexASCIICharsAtFilePos (uint32_t max) const
10430fdc8d8SChris Lattner {
10530fdc8d8SChris Lattner     uint32_t idx = m_index;
10630fdc8d8SChris Lattner     const size_t size = m_packet.size();
10730fdc8d8SChris Lattner     while (idx < size && idx - m_index < max && isxdigit(m_packet[idx]))
10830fdc8d8SChris Lattner         ++idx;
10930fdc8d8SChris Lattner     return idx - m_index;
11030fdc8d8SChris Lattner }
11130fdc8d8SChris Lattner //----------------------------------------------------------------------
11230fdc8d8SChris Lattner // Extract a signed character from two hex ASCII chars in the packet
11330fdc8d8SChris Lattner // string
11430fdc8d8SChris Lattner //----------------------------------------------------------------------
11530fdc8d8SChris Lattner int8_t
11630fdc8d8SChris Lattner StringExtractor::GetHexS8 (int8_t fail_value)
11730fdc8d8SChris Lattner {
11830fdc8d8SChris Lattner     if (GetNumHexASCIICharsAtFilePos(2))
11930fdc8d8SChris Lattner     {
12030fdc8d8SChris Lattner         char hi_nibble_char = m_packet[m_index];
12130fdc8d8SChris Lattner         char lo_nibble_char = m_packet[m_index+1];
12230fdc8d8SChris Lattner 
12330fdc8d8SChris Lattner         if (isxdigit(hi_nibble_char) && isxdigit(lo_nibble_char))
12430fdc8d8SChris Lattner         {
12530fdc8d8SChris Lattner             char hi_nibble = xdigit_to_sint (hi_nibble_char);
12630fdc8d8SChris Lattner             char lo_nibble = xdigit_to_sint (lo_nibble_char);
12730fdc8d8SChris Lattner             m_index += 2;
12830fdc8d8SChris Lattner             return (hi_nibble << 4) + lo_nibble;
12930fdc8d8SChris Lattner         }
13030fdc8d8SChris Lattner     }
13130fdc8d8SChris Lattner     m_index = UINT32_MAX;
13230fdc8d8SChris Lattner     return fail_value;
13330fdc8d8SChris Lattner }
13430fdc8d8SChris Lattner 
13530fdc8d8SChris Lattner //----------------------------------------------------------------------
13630fdc8d8SChris Lattner // Extract an unsigned character from two hex ASCII chars in the packet
13730fdc8d8SChris Lattner // string
13830fdc8d8SChris Lattner //----------------------------------------------------------------------
13930fdc8d8SChris Lattner uint8_t
14030fdc8d8SChris Lattner StringExtractor::GetHexU8 (uint8_t fail_value)
14130fdc8d8SChris Lattner {
14230fdc8d8SChris Lattner     if (GetNumHexASCIICharsAtFilePos(2))
14330fdc8d8SChris Lattner     {
14430fdc8d8SChris Lattner         uint8_t hi_nibble_char = m_packet[m_index];
14530fdc8d8SChris Lattner         uint8_t lo_nibble_char = m_packet[m_index+1];
14630fdc8d8SChris Lattner 
14730fdc8d8SChris Lattner         if (isxdigit(hi_nibble_char) && isxdigit(lo_nibble_char))
14830fdc8d8SChris Lattner         {
14930fdc8d8SChris Lattner             uint8_t hi_nibble = xdigit_to_sint (hi_nibble_char);
15030fdc8d8SChris Lattner             uint8_t lo_nibble = xdigit_to_sint (lo_nibble_char);
15130fdc8d8SChris Lattner             m_index += 2;
15230fdc8d8SChris Lattner             return (hi_nibble << 4) + lo_nibble;
15330fdc8d8SChris Lattner         }
15430fdc8d8SChris Lattner     }
15530fdc8d8SChris Lattner     m_index = UINT32_MAX;
15630fdc8d8SChris Lattner     return fail_value;
15730fdc8d8SChris Lattner }
15830fdc8d8SChris Lattner 
15930fdc8d8SChris Lattner uint32_t
16030fdc8d8SChris Lattner StringExtractor::GetHexMaxU32 (bool little_endian, uint32_t fail_value)
16130fdc8d8SChris Lattner {
16230fdc8d8SChris Lattner     uint32_t result = 0;
16330fdc8d8SChris Lattner     uint32_t nibble_count = 0;
16430fdc8d8SChris Lattner 
16530fdc8d8SChris Lattner     if (little_endian)
16630fdc8d8SChris Lattner     {
16730fdc8d8SChris Lattner         uint32_t shift_amount = 0;
16830fdc8d8SChris Lattner         while (m_index < m_packet.size() && ::isxdigit (m_packet[m_index]))
16930fdc8d8SChris Lattner         {
17030fdc8d8SChris Lattner             // Make sure we don't exceed the size of a uint32_t...
17130fdc8d8SChris Lattner             if (nibble_count >= (sizeof(uint32_t) * 2))
17230fdc8d8SChris Lattner             {
17330fdc8d8SChris Lattner                 m_index = UINT32_MAX;
17430fdc8d8SChris Lattner                 return fail_value;
17530fdc8d8SChris Lattner             }
17630fdc8d8SChris Lattner 
17730fdc8d8SChris Lattner             uint8_t nibble_lo;
17830fdc8d8SChris Lattner             uint8_t nibble_hi = xdigit_to_sint (m_packet[m_index]);
17930fdc8d8SChris Lattner             ++m_index;
18030fdc8d8SChris Lattner             if (m_index < m_packet.size() && ::isxdigit (m_packet[m_index]))
18130fdc8d8SChris Lattner             {
18230fdc8d8SChris Lattner                 nibble_lo = xdigit_to_sint (m_packet[m_index]);
18330fdc8d8SChris Lattner                 ++m_index;
18430fdc8d8SChris Lattner                 result |= ((uint32_t)nibble_hi << (shift_amount + 4));
18530fdc8d8SChris Lattner                 result |= ((uint32_t)nibble_lo << shift_amount);
18630fdc8d8SChris Lattner                 nibble_count += 2;
18730fdc8d8SChris Lattner                 shift_amount += 8;
18830fdc8d8SChris Lattner             }
18930fdc8d8SChris Lattner             else
19030fdc8d8SChris Lattner             {
19130fdc8d8SChris Lattner                 result |= ((uint32_t)nibble_hi << shift_amount);
19230fdc8d8SChris Lattner                 nibble_count += 1;
19330fdc8d8SChris Lattner                 shift_amount += 4;
19430fdc8d8SChris Lattner             }
19530fdc8d8SChris Lattner 
19630fdc8d8SChris Lattner         }
19730fdc8d8SChris Lattner     }
19830fdc8d8SChris Lattner     else
19930fdc8d8SChris Lattner     {
20030fdc8d8SChris Lattner         while (m_index < m_packet.size() && ::isxdigit (m_packet[m_index]))
20130fdc8d8SChris Lattner         {
20230fdc8d8SChris Lattner             // Make sure we don't exceed the size of a uint32_t...
20330fdc8d8SChris Lattner             if (nibble_count >= (sizeof(uint32_t) * 2))
20430fdc8d8SChris Lattner             {
20530fdc8d8SChris Lattner                 m_index = UINT32_MAX;
20630fdc8d8SChris Lattner                 return fail_value;
20730fdc8d8SChris Lattner             }
20830fdc8d8SChris Lattner 
20930fdc8d8SChris Lattner             uint8_t nibble = xdigit_to_sint (m_packet[m_index]);
21030fdc8d8SChris Lattner             // Big Endian
21130fdc8d8SChris Lattner             result <<= 4;
21230fdc8d8SChris Lattner             result |= nibble;
21330fdc8d8SChris Lattner 
21430fdc8d8SChris Lattner             ++m_index;
21530fdc8d8SChris Lattner             ++nibble_count;
21630fdc8d8SChris Lattner         }
21730fdc8d8SChris Lattner     }
21830fdc8d8SChris Lattner     return result;
21930fdc8d8SChris Lattner }
22030fdc8d8SChris Lattner 
22130fdc8d8SChris Lattner uint64_t
22230fdc8d8SChris Lattner StringExtractor::GetHexMaxU64 (bool little_endian, uint64_t fail_value)
22330fdc8d8SChris Lattner {
22430fdc8d8SChris Lattner     uint64_t result = 0;
22530fdc8d8SChris Lattner     uint32_t nibble_count = 0;
22630fdc8d8SChris Lattner 
22730fdc8d8SChris Lattner     if (little_endian)
22830fdc8d8SChris Lattner     {
22930fdc8d8SChris Lattner         uint32_t shift_amount = 0;
23030fdc8d8SChris Lattner         while (m_index < m_packet.size() && ::isxdigit (m_packet[m_index]))
23130fdc8d8SChris Lattner         {
23230fdc8d8SChris Lattner             // Make sure we don't exceed the size of a uint64_t...
23330fdc8d8SChris Lattner             if (nibble_count >= (sizeof(uint64_t) * 2))
23430fdc8d8SChris Lattner             {
23530fdc8d8SChris Lattner                 m_index = UINT32_MAX;
23630fdc8d8SChris Lattner                 return fail_value;
23730fdc8d8SChris Lattner             }
23830fdc8d8SChris Lattner 
23930fdc8d8SChris Lattner             uint8_t nibble_lo;
24030fdc8d8SChris Lattner             uint8_t nibble_hi = xdigit_to_sint (m_packet[m_index]);
24130fdc8d8SChris Lattner             ++m_index;
24230fdc8d8SChris Lattner             if (m_index < m_packet.size() && ::isxdigit (m_packet[m_index]))
24330fdc8d8SChris Lattner             {
24430fdc8d8SChris Lattner                 nibble_lo = xdigit_to_sint (m_packet[m_index]);
24530fdc8d8SChris Lattner                 ++m_index;
24630fdc8d8SChris Lattner                 result |= ((uint64_t)nibble_hi << (shift_amount + 4));
24730fdc8d8SChris Lattner                 result |= ((uint64_t)nibble_lo << shift_amount);
24830fdc8d8SChris Lattner                 nibble_count += 2;
24930fdc8d8SChris Lattner                 shift_amount += 8;
25030fdc8d8SChris Lattner             }
25130fdc8d8SChris Lattner             else
25230fdc8d8SChris Lattner             {
25330fdc8d8SChris Lattner                 result |= ((uint64_t)nibble_hi << shift_amount);
25430fdc8d8SChris Lattner                 nibble_count += 1;
25530fdc8d8SChris Lattner                 shift_amount += 4;
25630fdc8d8SChris Lattner             }
25730fdc8d8SChris Lattner 
25830fdc8d8SChris Lattner         }
25930fdc8d8SChris Lattner     }
26030fdc8d8SChris Lattner     else
26130fdc8d8SChris Lattner     {
26230fdc8d8SChris Lattner         while (m_index < m_packet.size() && ::isxdigit (m_packet[m_index]))
26330fdc8d8SChris Lattner         {
26430fdc8d8SChris Lattner             // Make sure we don't exceed the size of a uint64_t...
26530fdc8d8SChris Lattner             if (nibble_count >= (sizeof(uint64_t) * 2))
26630fdc8d8SChris Lattner             {
26730fdc8d8SChris Lattner                 m_index = UINT32_MAX;
26830fdc8d8SChris Lattner                 return fail_value;
26930fdc8d8SChris Lattner             }
27030fdc8d8SChris Lattner 
27130fdc8d8SChris Lattner             uint8_t nibble = xdigit_to_sint (m_packet[m_index]);
27230fdc8d8SChris Lattner             // Big Endian
27330fdc8d8SChris Lattner             result <<= 4;
27430fdc8d8SChris Lattner             result |= nibble;
27530fdc8d8SChris Lattner 
27630fdc8d8SChris Lattner             ++m_index;
27730fdc8d8SChris Lattner             ++nibble_count;
27830fdc8d8SChris Lattner         }
27930fdc8d8SChris Lattner     }
28030fdc8d8SChris Lattner     return result;
28130fdc8d8SChris Lattner }
28230fdc8d8SChris Lattner 
28330fdc8d8SChris Lattner size_t
28430fdc8d8SChris Lattner StringExtractor::GetHexBytes (void *dst_void, size_t dst_len, uint8_t fail_fill_value)
28530fdc8d8SChris Lattner {
28630fdc8d8SChris Lattner     uint8_t *dst = (uint8_t*)dst_void;
28730fdc8d8SChris Lattner     size_t bytes_extracted = 0;
28830fdc8d8SChris Lattner     while (bytes_extracted < dst_len && GetBytesLeft ())
28930fdc8d8SChris Lattner     {
29030fdc8d8SChris Lattner         dst[bytes_extracted] = GetHexU8 (fail_fill_value);
29130fdc8d8SChris Lattner         if (IsGood())
29230fdc8d8SChris Lattner             ++bytes_extracted;
29330fdc8d8SChris Lattner         else
29430fdc8d8SChris Lattner             break;
29530fdc8d8SChris Lattner     }
29630fdc8d8SChris Lattner 
29730fdc8d8SChris Lattner     for (size_t i = bytes_extracted; i < dst_len; ++i)
29830fdc8d8SChris Lattner         dst[i] = fail_fill_value;
29930fdc8d8SChris Lattner 
30030fdc8d8SChris Lattner     return bytes_extracted;
30130fdc8d8SChris Lattner }
30230fdc8d8SChris Lattner 
30330fdc8d8SChris Lattner 
30430fdc8d8SChris Lattner // Consume ASCII hex nibble character pairs until we have decoded byte_size
30530fdc8d8SChris Lattner // bytes of data.
30630fdc8d8SChris Lattner 
30730fdc8d8SChris Lattner uint64_t
30830fdc8d8SChris Lattner StringExtractor::GetHexWithFixedSize (uint32_t byte_size, bool little_endian, uint64_t fail_value)
30930fdc8d8SChris Lattner {
31030fdc8d8SChris Lattner     if (byte_size <= 8 && GetBytesLeft() >= byte_size * 2)
31130fdc8d8SChris Lattner     {
31230fdc8d8SChris Lattner         uint64_t result = 0;
31330fdc8d8SChris Lattner         uint32_t i;
31430fdc8d8SChris Lattner         if (little_endian)
31530fdc8d8SChris Lattner         {
31630fdc8d8SChris Lattner             // Little Endian
31730fdc8d8SChris Lattner             uint32_t shift_amount;
31830fdc8d8SChris Lattner             for (i = 0, shift_amount = 0;
31930fdc8d8SChris Lattner                  i < byte_size && m_index != UINT32_MAX;
32030fdc8d8SChris Lattner                  ++i, shift_amount += 8)
32130fdc8d8SChris Lattner             {
32230fdc8d8SChris Lattner                 result |= ((uint64_t)GetHexU8() << shift_amount);
32330fdc8d8SChris Lattner             }
32430fdc8d8SChris Lattner         }
32530fdc8d8SChris Lattner         else
32630fdc8d8SChris Lattner         {
32730fdc8d8SChris Lattner             // Big Endian
32830fdc8d8SChris Lattner             for (i = 0; i < byte_size && m_index != UINT32_MAX; ++i)
32930fdc8d8SChris Lattner             {
33030fdc8d8SChris Lattner                 result <<= 8;
33130fdc8d8SChris Lattner                 result |= GetHexU8();
33230fdc8d8SChris Lattner             }
33330fdc8d8SChris Lattner         }
33430fdc8d8SChris Lattner     }
33530fdc8d8SChris Lattner     m_index = UINT32_MAX;
33630fdc8d8SChris Lattner     return fail_value;
33730fdc8d8SChris Lattner }
33830fdc8d8SChris Lattner 
33930fdc8d8SChris Lattner bool
34030fdc8d8SChris Lattner StringExtractor::GetNameColonValue (std::string &name, std::string &value)
34130fdc8d8SChris Lattner {
34230fdc8d8SChris Lattner     // Read something in the form of NNNN:VVVV; where NNNN is any character
34330fdc8d8SChris Lattner     // that is not a colon, followed by a ':' character, then a value (one or
34430fdc8d8SChris Lattner     // more ';' chars), followed by a ';'
34530fdc8d8SChris Lattner     if (m_index < m_packet.size())
34630fdc8d8SChris Lattner     {
34730fdc8d8SChris Lattner         const size_t colon_idx = m_packet.find (':', m_index);
34830fdc8d8SChris Lattner         if (colon_idx != std::string::npos)
34930fdc8d8SChris Lattner         {
35030fdc8d8SChris Lattner             const size_t semicolon_idx = m_packet.find (';', colon_idx);
35130fdc8d8SChris Lattner             if (semicolon_idx != std::string::npos)
35230fdc8d8SChris Lattner             {
35330fdc8d8SChris Lattner                 name.assign (m_packet, m_index, colon_idx - m_index);
35430fdc8d8SChris Lattner                 value.assign (m_packet, colon_idx + 1, semicolon_idx - (colon_idx + 1));
35530fdc8d8SChris Lattner                 m_index = semicolon_idx + 1;
35630fdc8d8SChris Lattner                 return true;
35730fdc8d8SChris Lattner             }
35830fdc8d8SChris Lattner         }
35930fdc8d8SChris Lattner     }
36030fdc8d8SChris Lattner     m_index = UINT32_MAX;
36130fdc8d8SChris Lattner     return false;
36230fdc8d8SChris Lattner }
363