LLVM: lib/Support/JSON.cpp Source File

//=== JSON.cpp - JSON value, parsing and serialization - C++ -----------*-===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===---------------------------------------------------------------------===//


#include "llvm/Support/JSON.h"

#include "llvm/ADT/STLExtras.h"

#include "llvm/ADT/StringExtras.h"

#include "llvm/Support/ConvertUTF.h"

#include "llvm/Support/Error.h"

#include "llvm/Support/Format.h"

#include "llvm/Support/NativeFormatting.h"

#include "llvm/Support/raw_ostream.h"

#include <cctype>

#include <cerrno>

#include <optional>


namespace llvm {

namespace json {


/// Returns a reference to the value stored under \p K. The lookup goes through
/// try_emplace() with a null placeholder, so the returned reference is always
/// backed by an entry of this object.
Value &Object::operator[](const ObjectKey &K) {
  auto Result = try_emplace(K, nullptr);
  return Result.first->getSecond();
}


/// Rvalue-key overload: \p K is moved into try_emplace(), which is given a
/// null placeholder value, and a reference to the stored value is returned.
Value &Object::operator[](ObjectKey &&K) {
  auto Result = try_emplace(std::move(K), nullptr);
  return Result.first->getSecond();
}


/// Returns a pointer to the value stored under \p K, or nullptr when find()
/// reports that the key is not present.
Value *Object::get(StringRef K) {
  auto Found = find(K);
  return Found == end() ? nullptr : &Found->second;
}


/// Const overload: returns a pointer to the value stored under \p K, or
/// nullptr when find() reports that the key is not present.
const Value *Object::get(StringRef K) const {
  auto Found = find(K);
  return Found == end() ? nullptr : &Found->second;
}


/// Returns std::nullopt when \p K is absent; otherwise forwards the result of
/// Value::getAsNull() for the stored value.
std::optional<std::nullptr_t> Object::getNull(StringRef K) const {
  const Value *Found = get(K);
  if (!Found)
    return std::nullopt;
  return Found->getAsNull();
}


/// Returns std::nullopt when \p K is absent; otherwise forwards the result of
/// Value::getAsBoolean() for the stored value.
std::optional<bool> Object::getBoolean(StringRef K) const {
  const Value *Found = get(K);
  if (!Found)
    return std::nullopt;
  return Found->getAsBoolean();
}


/// Returns std::nullopt when \p K is absent; otherwise forwards the result of
/// Value::getAsNumber() for the stored value.
std::optional<double> Object::getNumber(StringRef K) const {
  const Value *Found = get(K);
  if (!Found)
    return std::nullopt;
  return Found->getAsNumber();
}


/// Returns std::nullopt when \p K is absent; otherwise forwards the result of
/// Value::getAsInteger() for the stored value.
std::optional<int64_t> Object::getInteger(StringRef K) const {
  const Value *Found = get(K);
  if (!Found)
    return std::nullopt;
  return Found->getAsInteger();
}


/// Returns std::nullopt when \p K is absent; otherwise forwards the result of
/// Value::getAsString() for the stored value.
std::optional<llvm::StringRef> Object::getString(StringRef K) const {
  const Value *Found = get(K);
  if (!Found)
    return std::nullopt;
  return Found->getAsString();
}


/// Returns nullptr when \p K is absent; otherwise forwards the result of
/// Value::getAsObject() for the stored value.
const json::Object *Object::getObject(StringRef K) const {
  const Value *Found = get(K);
  return Found ? Found->getAsObject() : nullptr;
}


/// Mutable overload: returns nullptr when \p K is absent; otherwise forwards
/// the result of Value::getAsObject() for the stored value.
json::Object *Object::getObject(StringRef K) {
  Value *Found = get(K);
  return Found ? Found->getAsObject() : nullptr;
}


/// Returns nullptr when \p K is absent; otherwise forwards the result of
/// Value::getAsArray() for the stored value.
const json::Array *Object::getArray(StringRef K) const {
  const Value *Found = get(K);
  return Found ? Found->getAsArray() : nullptr;
}


/// Mutable overload: returns nullptr when \p K is absent; otherwise forwards
/// the result of Value::getAsArray() for the stored value.
json::Array *Object::getArray(StringRef K) {
  Value *Found = get(K);
  return Found ? Found->getAsArray() : nullptr;
}


/// Two objects are equal exactly when their underlying maps (member M) compare
/// equal.
bool operator==(const Object &LHS, const Object &RHS) {
  const auto &Left = LHS.M;
  const auto &Right = RHS.M;
  return Left == Right;
}


/// Builds the array from \p Elements, preserving their order.
///
/// Each slot is first created as a null value and then filled with
/// Value::moveFrom(). The elements of an initializer_list are const, so the
/// std::move below yields a `const Value &&`, which is the parameter type
/// moveFrom() accepts.
Array::Array(std::initializer_list<Value> Elements) {
  V.reserve(Elements.size());
  for (const Value &Element : Elements) {
    emplace_back(nullptr);
    Value &Slot = back();
    Slot.moveFrom(std::move(Element));
  }
}


/// Constructs an array-valued Value from a braced list of elements by first
/// building a json::Array from \p Elements and delegating to the constructor
/// that accepts that array.
// Parentheses (not braces) are used for json::Array(Elements) so that the
// list is handed to the Array constructor as a whole.
Value::Value(std::initializer_list<Value> Elements)
    : Value(json::Array(Elements)) {}


/// Makes this value a copy of \p M.
///
/// The type tag is copied first. String-ref, string, object and array payloads
/// are copy-constructed in place via create<T>(); the remaining kinds (null,
/// boolean, double, signed and unsigned integer) are copied bytewise.
void Value::copyFrom(const Value &M) {
  Type = M.Type;
  switch (Type) {
  case T_StringRef:
    create<StringRef>(M.as<StringRef>());
    return;
  case T_String:
    create<std::string>(M.as<std::string>());
    return;
  case T_Object:
    create<json::Object>(M.as<json::Object>());
    return;
  case T_Array:
    create<json::Array>(M.as<json::Array>());
    return;
  case T_Null:
  case T_Boolean:
  case T_Double:
  case T_Integer:
  case T_UINT64:
    // Plain-data payloads: copy the raw storage.
    memcpy(&Union, &M.Union, sizeof(Union));
    return;
  }
}


/// Takes over the contents of \p M.
///
/// The type tag is copied first. For string, object and array payloads the
/// payload is move-constructed in place and M.Type is then set to T_Null;
/// destroy() does nothing for T_Null, so \p M will not later run the payload's
/// destructor. String-ref payloads are copy-constructed, and the remaining
/// kinds are copied bytewise; in both of those cases \p M keeps its tag.
void Value::moveFrom(const Value &&M) {
  Type = M.Type;
  switch (Type) {
  case T_String:
    create<std::string>(std::move(M.as<std::string>()));
    M.Type = T_Null;
    return;
  case T_Object:
    create<json::Object>(std::move(M.as<json::Object>()));
    M.Type = T_Null;
    return;
  case T_Array:
    create<json::Array>(std::move(M.as<json::Array>()));
    M.Type = T_Null;
    return;
  case T_StringRef:
    create<StringRef>(M.as<StringRef>());
    return;
  case T_Null:
  case T_Boolean:
  case T_Double:
  case T_Integer:
  case T_UINT64:
    // Plain-data payloads: copy the raw storage.
    memcpy(&Union, &M.Union, sizeof(Union));
    return;
  }
}


/// Runs the destructor of the payload selected by the current type tag.
/// Nothing is done for null, boolean, double and integer kinds. The tag itself
/// is left untouched.
void Value::destroy() {
  switch (Type) {
  case T_StringRef:
    as<StringRef>().~StringRef();
    return;
  case T_String:
    as<std::string>().~basic_string();
    return;
  case T_Object:
    as<json::Object>().~Object();
    return;
  case T_Array:
    as<json::Array>().~Array();
    return;
  case T_Null:
  case T_Boolean:
  case T_Double:
  case T_Integer:
  case T_UINT64:
    return;
  }
}


/// Writes this value to \p OS using the stream insertion operator for Value.
void Value::print(llvm::raw_ostream &OS) const {
  const Value &Self = *this;
  OS << Self;
}


/// Structural equality of two JSON values.
///
/// Values of different kind() are never equal. Within a kind, the payloads are
/// compared with the matching getAs*() accessor. Numbers are compared exactly
/// whenever both sides hold an integer representation, and as doubles
/// otherwise.
bool operator==(const Value &L, const Value &R) {
  if (L.kind() != R.kind())
    return false;
  switch (L.kind()) {
  case Value::Null:
    return *L.getAsNull() == *R.getAsNull();
  case Value::Boolean:
    return *L.getAsBoolean() == *R.getAsBoolean();
  case Value::Number:
    // Workaround for https://gcc.gnu.org/bugzilla/show_bug.cgi?id=323
    // The same integer must convert to the same double, per the standard.
    // However we see 64-vs-80-bit precision comparisons with gcc-7 -O3 -m32.
    // So we avoid floating point promotion for exact comparisons.
    if (L.Type == Value::T_Integer || R.Type == Value::T_Integer)
      return L.getAsInteger() == R.getAsInteger();
    // Two unsigned 64-bit payloads must also be compared exactly: a double has
    // a 53-bit significand, so distinct values such as 2^64-1 and 2^64-2 would
    // round to the same double and wrongly compare equal.
    if (L.Type == Value::T_UINT64 && R.Type == Value::T_UINT64)
      return *L.getAsUINT64() == *R.getAsUINT64();
    return *L.getAsNumber() == *R.getAsNumber();
  case Value::String:
    return *L.getAsString() == *R.getAsString();
  case Value::Array:
    return *L.getAsArray() == *R.getAsArray();
  case Value::Object:
    return *L.getAsObject() == *R.getAsObject();
  }
  llvm_unreachable("Unknown value kind");
}


/// Records \p Msg and the location of this path in the root context.
///
/// The parent chain is walked twice: once to find the root and count the
/// segments, and once to copy the segments into Root::ErrorPath. The copy
/// starts at this node, so the stored path is in leaf-to-root order.
void Path::report(llvm::StringLiteral Msg) {
  // Pass 1: locate the root and measure the depth.
  unsigned Depth = 0;
  const Path *Cur = this;
  while (Cur->Parent != nullptr) {
    ++Depth;
    Cur = Cur->Parent;
  }
  Path::Root *R = Cur->Seg.root();

  // Pass 2: store the message and the (reversed) path.
  R->ErrorMessage = Msg;
  R->ErrorPath.resize(Depth);
  auto Slot = R->ErrorPath.begin();
  for (Cur = this; Cur->Parent != nullptr; Cur = Cur->Parent) {
    *Slot = Cur->Seg;
    ++Slot;
  }
}


/// Builds an Error describing the recorded failure.
///
/// The text starts with ErrorMessage (or "invalid JSON contents" when no
/// message was recorded). With an empty ErrorPath it is followed by
/// " when parsing <Name>" if Name is set; otherwise by " at <Name or (root)>"
/// and the path segments, printed from the root down as `.field` or `[index]`.
Error Path::Root::getError() const {
  std::string Message;
  raw_string_ostream OS(Message);

  if (ErrorMessage.empty())
    OS << "invalid JSON contents";
  else
    OS << ErrorMessage;

  if (!ErrorPath.empty()) {
    OS << " at ";
    if (Name.empty())
      OS << "(root)";
    else
      OS << Name;
    // ErrorPath is stored leaf-first, so walk it backwards.
    for (const Path::Segment &Seg : llvm::reverse(ErrorPath)) {
      if (Seg.isField())
        OS << '.' << Seg.field();
      else
        OS << '[' << Seg.index() << ']';
    }
  } else if (!Name.empty()) {
    OS << " when parsing " << Name;
  }

  return createStringError(llvm::inconvertibleErrorCode(), Message);
}


std::vector<const Object::value_type *> sortedElements(const Object &O) {

  std::vector<const Object::value_type *> Elements;

  for (const auto &E : O)

    Elements.push_back(&E);

  llvm::sort(Elements,

             [](const Object::value_type *L, const Object::value_type *R) {

               return L->first < R->first;

             });

  return Elements;

}


// Prints a one-line version of a value that isn't our main focus.

// We interleave writes to OS and JOS, exploiting the lack of extra buffering.

// This is OK as we own the implementation.


static void abbreviate(const Value &V, OStream &JOS) {

  switch (V.kind()) {

  case Value::Array:

    JOS.rawValue(V.getAsArray()->empty() ? "[]" : "[ ... ]");

    break;

  case Value::Object:

    JOS.rawValue(V.getAsObject()->empty() ? "{}" : "{ ... }");

    break;

  case Value::String: {

    llvm::StringRef S = *V.getAsString();

    if (S.size() < 40) {

      JOS.value(V);

    } else {

      std::string Truncated = fixUTF8(S.take_front(37));

      Truncated.append("...");

      JOS.value(Truncated);

    }

    break;

  }

  default:

    JOS.value(V);

  }

}


// Prints a semi-expanded version of a value that is our main focus.

// Array/Object entries are printed, but not recursively as they may be huge.


static void abbreviateChildren(const Value &V, OStream &JOS) {

  switch (V.kind()) {

  case Value::Array:

    JOS.array([&] {

      for (const auto &I : *V.getAsArray())

        abbreviate(I, JOS);

    });

    break;

  case Value::Object:

    JOS.object([&] {

      for (const auto *KV : sortedElements(*V.getAsObject())) {

        JOS.attributeBegin(KV->first);

        abbreviate(KV->second, JOS);

        JOS.attributeEnd();

      }

    });

    break;

  default:

    JOS.value(V);

  }

}


/// Pretty-prints \p R to \p OS (indent 2) with the recorded error marked as a
/// comment at the location named by ErrorPath.
///
/// Ancestors of the target are expanded, their siblings are printed with
/// abbreviate(), and the target itself with abbreviateChildren(). If the path
/// cannot be followed (wrong kind, missing field, index out of range), the
/// deepest node that was reached is highlighted instead.
void Path::Root::printErrorContext(const Value &R, raw_ostream &OS) const {
  OStream JOS(OS, /*IndentSize=*/2);

  // Generic lambda; 'Recurse' is the lambda itself, to allow recursive calls.
  auto PrintValue = [&](const Value &V, ArrayRef<Segment> Path, auto &Recurse) {
    // Emits the current node preceded by the "error: ..." comment.
    auto HighlightCurrent = [&] {
      std::string Comment =
          "error: " + std::string(ErrorMessage.data(), ErrorMessage.size());
      JOS.comment(Comment);
      abbreviateChildren(V, JOS);
    };

    // An exhausted path means V is the target.
    if (Path.empty())
      return HighlightCurrent();

    // Path is stored in reverse order, so the next step is the last segment.
    const Segment &S = Path.back();
    ArrayRef<Segment> Remaining = Path.drop_back();

    if (!S.isField()) {
      // The step names an array element.
      const Array *A = V.getAsArray();
      if (!A || S.index() >= A->size())
        return HighlightCurrent();
      JOS.array([&] {
        unsigned Index = 0;
        for (const Value &Element : *A) {
          if (Index == S.index())
            Recurse(Element, Remaining, Recurse);
          else
            abbreviate(Element, JOS);
          ++Index;
        }
      });
    } else {
      // The step names an object field.
      llvm::StringRef FieldName = S.field();
      const Object *O = V.getAsObject();
      if (!O || !O->get(FieldName))
        return HighlightCurrent();
      JOS.object([&] {
        for (const auto *Entry : sortedElements(*O)) {
          JOS.attributeBegin(Entry->first);
          if (FieldName == StringRef(Entry->first))
            Recurse(Entry->second, Remaining, Recurse);
          else
            abbreviate(Entry->second, JOS);
          JOS.attributeEnd();
        }
      });
    }
  };

  PrintValue(R, ErrorPath, PrintValue);
}


namespace {
/// Simple recursive-descent JSON parser over a caller-owned text buffer.
///
/// The parser keeps three pointers into the input: Start (beginning), P
/// (cursor) and End (one past the last byte). The parse*() members return
/// false on invalid input after storing an error through parseError(); that
/// error is retrieved with takeError().
class Parser {
public:
  Parser(StringRef JSON)
      : Start(JSON.begin()), P(JSON.begin()), End(JSON.end()) {}

  /// Validates the whole input as UTF-8. On failure the cursor is moved to the
  /// offending offset (so the error carries a useful line/column) and an error
  /// is recorded.
  bool checkUTF8() {
    size_t ErrOffset;
    if (!isUTF8(StringRef(Start, End - Start), &ErrOffset)) {
      P = Start + ErrOffset; // For line/column calculation.
      return parseError("Invalid UTF-8 sequence");
    }
    return true;
  }

  bool parseValue(Value &Out);

  /// Succeeds only if nothing but whitespace remains after the cursor.
  bool assertEnd() {
    eatWhitespace();
    if (P != End)
      return parseError("Text after end of document");
    return true;
  }

  /// Hands out the stored error. Must only be called after a failure.
  Error takeError() {
    assert(Err);
    return std::move(*Err);
  }

private:
  /// Advances the cursor past spaces, carriage returns, newlines and tabs.
  void eatWhitespace() {
    for (; P != End; ++P) {
      const char C = *P;
      if (C != ' ' && C != '\r' && C != '\n' && C != '\t')
        break;
    }
  }

  // On invalid syntax, parseX() functions return false and set Err.
  bool parseNumber(char First, Value &Out);
  bool parseString(std::string &Out);
  bool parseUnicode(std::string &Out);
  bool parseError(const char *Msg); // always returns false

  /// Consumes and returns the next byte, or returns 0 at end of input.
  char next() {
    if (P == End)
      return 0;
    return *P++;
  }

  /// Returns the next byte without consuming it, or 0 at end of input.
  char peek() {
    if (P == End)
      return 0;
    return *P;
  }

  /// True for every character that may occur in a number token: the decimal
  /// digits, 'e', 'E', '+', '-' and '.'.
  static bool isNumber(char C) {
    switch (C) {
    case '0':
    case '1':
    case '2':
    case '3':
    case '4':
    case '5':
    case '6':
    case '7':
    case '8':
    case '9':
    case 'e':
    case 'E':
    case '+':
    case '-':
    case '.':
      return true;
    default:
      return false;
    }
  }

  std::optional<Error> Err;
  const char *Start, *P, *End;
};
} // namespace


/// Parses one JSON value at the cursor into \p Out.
///
/// Leading whitespace is skipped. The first character selects the kind:
/// 'n'/'t'/'f' for the bare literals, '"' for a string, '[' for an array,
/// '{' for an object, and any number character for a number. Arrays and
/// objects recurse into parseValue() for their members. Returns false after
/// recording an error when the input is malformed.
bool Parser::parseValue(Value &Out) {
  eatWhitespace();
  if (P == End)
    return parseError("Unexpected EOF");

  switch (char C = next()) {
  // Bare null/true/false are easy - first char identifies them.
  case 'n':
    Out = nullptr;
    if (next() == 'u' && next() == 'l' && next() == 'l')
      return true;
    return parseError("Invalid JSON value (null?)");
  case 't':
    Out = true;
    if (next() == 'r' && next() == 'u' && next() == 'e')
      return true;
    return parseError("Invalid JSON value (true?)");
  case 'f':
    Out = false;
    if (next() == 'a' && next() == 'l' && next() == 's' && next() == 'e')
      return true;
    return parseError("Invalid JSON value (false?)");
  case '"': {
    std::string Text;
    if (!parseString(Text))
      return false;
    Out = std::move(Text);
    return true;
  }
  case '[': {
    Out = Array{};
    Array &Elements = *Out.getAsArray();
    eatWhitespace();
    if (peek() == ']') {
      ++P;
      return true;
    }
    while (true) {
      Elements.emplace_back(nullptr);
      if (!parseValue(Elements.back()))
        return false;
      eatWhitespace();
      const char Sep = next();
      if (Sep == ']')
        return true;
      if (Sep != ',')
        return parseError("Expected , or ] after array element");
      eatWhitespace();
    }
  }
  case '{': {
    Out = Object{};
    Object &Fields = *Out.getAsObject();
    eatWhitespace();
    if (peek() == '}') {
      ++P;
      return true;
    }
    while (true) {
      if (next() != '"')
        return parseError("Expected object key");
      std::string Key;
      if (!parseString(Key))
        return false;
      eatWhitespace();
      if (next() != ':')
        return parseError("Expected : after object key");
      eatWhitespace();
      if (!parseValue(Fields[std::move(Key)]))
        return false;
      eatWhitespace();
      const char Sep = next();
      if (Sep == '}')
        return true;
      if (Sep != ',')
        return parseError("Expected , or } after object property");
      eatWhitespace();
    }
  }
  default:
    if (isNumber(C))
      return parseNumber(C, Out);
    return parseError("Invalid JSON value");
  }
}


bool Parser::parseNumber(char First, Value &Out) {

  // Read the number into a string. (Must be null-terminated for strto*).

  SmallString<24> S;

  S.push_back(First);

  while (isNumber(peek()))

    S.push_back(next());

  char *End;

  // Try first to parse as integer, and if so preserve full 64 bits.

  // We check for errno for out of bounds errors and for End == S.end()

  // to make sure that the numeric string is not malformed.

  errno = 0;

  int64_t I = std::strtoll(S.c_str(), &End, 10);

  if (End == S.end() && errno != ERANGE) {

    Out = I;

    return true;

  }

  // strtroull has a special handling for negative numbers, but in this

  // case we don't want to do that because negative numbers were already

  // handled in the previous block.

  if (First != '-') {

    errno = 0;

    uint64_t UI = std::strtoull(S.c_str(), &End, 10);

    if (End == S.end() && errno != ERANGE) {

      Out = UI;

      return true;

    }

  }

  // If it's not an integer

  Out = std::strtod(S.c_str(), &End);

  return End == S.end() || parseError("Invalid JSON value (number?)");

}


/// Parses the remainder of a string literal (the opening quote was already
/// consumed) and appends the decoded bytes to \p Out.
///
/// Fails on end of input before the closing quote, on raw control characters
/// (bytes below 0x20), and on unknown escape sequences. \u escapes are
/// delegated to parseUnicode().
bool Parser::parseString(std::string &Out) {
  for (char C = next(); C != '"'; C = next()) {
    if (LLVM_UNLIKELY(P == End))
      return parseError("Unterminated string");
    if (LLVM_UNLIKELY((C & 0x1f) == C))
      return parseError("Control character in string");
    if (LLVM_LIKELY(C != '\\')) {
      Out.push_back(C);
      continue;
    }

    // Escape sequence: translate the character after the backslash.
    const char Escape = next();
    char Decoded;
    switch (Escape) {
    case '"':
    case '\\':
    case '/':
      Decoded = Escape;
      break;
    case 'b':
      Decoded = '\b';
      break;
    case 'f':
      Decoded = '\f';
      break;
    case 'n':
      Decoded = '\n';
      break;
    case 'r':
      Decoded = '\r';
      break;
    case 't':
      Decoded = '\t';
      break;
    case 'u':
      // parseUnicode appends to Out itself.
      if (!parseUnicode(Out))
        return false;
      continue;
    default:
      return parseError("Invalid escape sequence");
    }
    Out.push_back(Decoded);
  }
  return true;
}


/// Appends the UTF-8 encoding of code point \p Rune to \p Out, using one to
/// four bytes depending on its magnitude. Values of 0x110000 and above are
/// treated as unreachable.
static void encodeUtf8(uint32_t Rune, std::string &Out) {
  // Appends a lead byte: the given prefix bits plus the payload bits.
  auto Lead = [&Out](uint32_t Prefix, uint32_t Bits) {
    Out.push_back(static_cast<uint8_t>(Prefix | Bits));
  };
  // Appends a continuation byte (10xxxxxx) carrying the low six bits.
  auto Tail = [&Out](uint32_t Bits) {
    Out.push_back(static_cast<uint8_t>(0x80 | (Bits & 0x3F)));
  };

  if (Rune < 0x80) {
    Out.push_back(Rune & 0x7F);
    return;
  }
  if (Rune < 0x800) {
    Lead(0xC0, Rune >> 6);
    Tail(Rune);
    return;
  }
  if (Rune < 0x10000) {
    Lead(0xE0, Rune >> 12);
    Tail(Rune >> 6);
    Tail(Rune);
    return;
  }
  if (Rune < 0x110000) {
    Lead(0xF0, Rune >> 18);
    Tail(Rune >> 12);
    Tail(Rune >> 6);
    Tail(Rune);
    return;
  }
  llvm_unreachable("Invalid codepoint");
}


// Parse a UTF-16 \uNNNN escape sequence. "\u" has already been consumed.
// May parse several sequential escapes to ensure proper surrogate handling.
// We do not use ConvertUTF.h, it can't accept and replace unpaired surrogates.
// These are invalid Unicode but valid JSON (RFC 8259, section 8.2).
//
// The decoded text is appended to Out as UTF-8. Returns false (after recording
// an error) only when an escape does not consist of four hex digits.
bool Parser::parseUnicode(std::string &Out) {
  // Invalid UTF is not a JSON error (RFC 8259§8.2). It gets replaced by U+FFFD.
  auto Invalid = [&] { Out.append(/* UTF-8 */ {'\xef', '\xbf', '\xbd'}); };
  // Decodes 4 hex digits from the stream into Out, returns false on error.
  auto Parse4Hex = [this](uint16_t &Out) -> bool {
    Out = 0;
    char Bytes[] = {next(), next(), next(), next()};
    for (unsigned char C : Bytes) {
      if (!std::isxdigit(C))
        return parseError("Invalid \\u escape sequence");
      Out <<= 4;
      // Clearing bit 0x20 folds lowercase hex letters onto uppercase.
      Out |= (C > '9') ? (C & ~0x20) - 'A' + 10 : (C - '0');
    }
    return true;
  };
  uint16_t First; // UTF-16 code unit from the first \u escape.
  if (!Parse4Hex(First))
    return false;

  // We loop to allow proper surrogate-pair error handling.
  while (true) {
    // Case 1: the UTF-16 code unit is already a codepoint in the BMP.
    if (LLVM_LIKELY(First < 0xD800 || First >= 0xE000)) {
      encodeUtf8(First, Out);
      return true;
    }

    // Case 2: it's an (unpaired) trailing surrogate.
    if (LLVM_UNLIKELY(First >= 0xDC00)) {
      Invalid();
      return true;
    }

    // Case 3: it's a leading surrogate. We expect a trailing one next.
    // Case 3a: there's no trailing \u escape. Don't advance in the stream.
    // The remaining length is computed as End - P so that no pointer beyond
    // one-past-the-end of the buffer is ever formed.
    if (LLVM_UNLIKELY(End - P < 2 || *P != '\\' || *(P + 1) != 'u')) {
      Invalid(); // Leading surrogate was unpaired.
      return true;
    }
    P += 2;
    uint16_t Second;
    if (!Parse4Hex(Second))
      return false;
    // Case 3b: there was another \u escape, but it wasn't a trailing surrogate.
    if (LLVM_UNLIKELY(Second < 0xDC00 || Second >= 0xE000)) {
      Invalid();      // Leading surrogate was unpaired.
      First = Second; // Second escape still needs to be processed.
      continue;
    }
    // Case 3c: a valid surrogate pair encoding an astral codepoint.
    // The 0x10000 offset must be *added*: the high-surrogate payload shifted
    // left by 10 can itself occupy bit 16 (e.g. D840 DC00 is U+20000), so
    // combining with bitwise OR would lose the offset for such code points.
    encodeUtf8(0x10000 + ((First - 0xD800) << 10) + (Second - 0xDC00), Out);
    return true;
  }
}


/// Records a ParseError carrying \p Msg and the current cursor position, and
/// returns false so that callers can write `return parseError(...)`.
///
/// The line number is 1 plus the number of line feeds before the cursor; the
/// column is the distance from the start of that line, and the offset is the
/// distance from the start of the input.
bool Parser::parseError(const char *Msg) {
  int LineNo = 1;
  const char *LineStart = Start;
  for (const char *Cur = Start; Cur < P; ++Cur) {
    if (*Cur != 0x0A)
      continue;
    ++LineNo;
    LineStart = Cur + 1;
  }
  Err.emplace(
      std::make_unique<ParseError>(Msg, LineNo, P - LineStart, P - Start));
  return false;
}


/// Parses \p JSON as a single JSON document.
///
/// The input must be valid UTF-8, contain exactly one value, and have nothing
/// but whitespace after it. The three checks run in that order; the first one
/// that fails stops the process and its recorded error is returned.
Expected<Value> parse(StringRef JSON) {
  Parser P(JSON);
  Value E = nullptr;
  if (!P.checkUTF8() || !P.parseValue(E) || !P.assertEnd())
    return P.takeError();
  return std::move(E);
}


// Out-of-line definition of ParseError's static ID member.
// NOTE(review): presumably the address of this object (not its value) is what
// identifies the error class — confirm against the ParseError declaration.
char ParseError::ID = 0;


/// Returns true if \p S is valid UTF-8.
///
/// On failure, and only if \p ErrOffset is non-null, *ErrOffset receives the
/// offset at which isLegalUTF8String() stopped. It is not written on success.
bool isUTF8(llvm::StringRef S, size_t *ErrOffset) {
  // Fast-path for ASCII, which is valid UTF-8.
  if (LLVM_LIKELY(isASCII(S)))
    return true;

  const UTF8 *const Begin = reinterpret_cast<const UTF8 *>(S.data());
  const UTF8 *Cursor = Begin;
  const bool Legal = isLegalUTF8String(&Cursor, Begin + S.size());
  if (LLVM_LIKELY(Legal))
    return true;

  if (ErrOffset)
    *ErrOffset = Cursor - Begin;
  return false;
}


/// Returns a copy of \p S that has been round-tripped through UTF-32: decoded
/// with lenientConversion and re-encoded with strictConversion.
///
/// This isn't particularly efficient, but is only for error-recovery.
std::string fixUTF8(llvm::StringRef S) {
  // Stage 1: UTF-8 -> UTF-32. One codepoint per input byte always suffices.
  std::vector<UTF32> Decoded(S.size());
  const UTF8 *Src8 = reinterpret_cast<const UTF8 *>(S.data());
  const UTF8 *const Src8End = Src8 + S.size();
  UTF32 *Dst32 = Decoded.data();
  UTF32 *const Dst32End = Dst32 + Decoded.size();
  ConvertUTF8toUTF32(&Src8, Src8End, &Dst32, Dst32End, lenientConversion);
  Decoded.resize(Dst32 - Decoded.data());

  // Stage 2: UTF-32 -> UTF-8. Four bytes per codepoint always suffice.
  std::string Res(4 * Decoded.size(), 0);
  const UTF32 *Src32 = Decoded.data();
  const UTF32 *const Src32End = Src32 + Decoded.size();
  UTF8 *Dst8 = reinterpret_cast<UTF8 *>(&Res[0]);
  UTF8 *const Dst8End = Dst8 + Res.size();
  ConvertUTF32toUTF8(&Src32, Src32End, &Dst8, Dst8End, strictConversion);
  Res.resize(reinterpret_cast<char *>(Dst8) - Res.data());
  return Res;
}


/// Writes \p S to \p OS as a double-quoted JSON string.
///
/// The quote character (0x22) and backslash (0x5C) are preceded by a
/// backslash. Bytes below 0x20 are written as \t, \n, \r, or as a \u escape
/// with four lowercase hex digits. Every other byte is written unchanged.
static void quote(llvm::raw_ostream &OS, llvm::StringRef S) {
  OS << '\"';
  for (unsigned char C : S) {
    if (C >= 0x20) {
      // Printable range: only '"' (0x22) and '\' (0x5C) need escaping.
      if (C == 0x22 || C == 0x5C)
        OS << '\\';
      OS << C;
      continue;
    }

    // Control character: always escaped.
    OS << '\\';
    // A few characters are common enough to make short escapes worthwhile.
    if (C == '\t') {
      OS << 't';
    } else if (C == '\n') {
      OS << 'n';
    } else if (C == '\r') {
      OS << 'r';
    } else {
      OS << 'u';
      llvm::write_hex(OS, C, llvm::HexPrintStyle::Lower, 4);
    }
  }
  OS << '\"';
}


/// Emits \p V as a self-contained JSON value.
///
/// Scalars are written directly after valueBegin(). Integers are printed
/// exactly, other numbers with max_digits10 significant digits. Arrays and
/// objects are emitted through array()/object(), recursing for their members;
/// object attributes are written in sorted key order.
void llvm::json::OStream::value(const Value &V) {
  switch (V.kind()) {
  case Value::Null:
    valueBegin();
    OS << "null";
    return;
  case Value::Boolean: {
    valueBegin();
    const bool Flag = *V.getAsBoolean();
    OS << (Flag ? "true" : "false");
    return;
  }
  case Value::Number:
    valueBegin();
    if (V.Type == Value::T_UINT64)
      OS << *V.getAsUINT64();
    else if (V.Type == Value::T_Integer)
      OS << *V.getAsInteger();
    else
      OS << format("%.*g", std::numeric_limits<double>::max_digits10,
                   *V.getAsNumber());
    return;
  case Value::String:
    valueBegin();
    quote(OS, *V.getAsString());
    return;
  case Value::Array:
    array([&] {
      for (const Value &Element : *V.getAsArray())
        value(Element);
    });
    return;
  case Value::Object:
    object([&] {
      for (const Object::value_type *Entry : sortedElements(*V.getAsObject()))
        attribute(Entry->first, Entry->second);
    });
    return;
  }
}


/// Prepares the stream for the next value in the current context: writes a
/// separating comma if the context already holds a value, starts a new line
/// inside arrays, flushes any pending comment, and marks the context as
/// holding a value. Must not be called directly inside an object context.
void llvm::json::OStream::valueBegin() {
  auto &Top = Stack.back();
  assert(Top.Ctx != Object && "Only attributes allowed here");
  if (Top.HasValue) {
    assert(Top.Ctx != Singleton && "Only one value allowed here");
    OS << ',';
  }
  if (Top.Ctx == Array)
    newline();
  flushComment();
  Top.HasValue = true;
}


/// Registers \p Comment to be written by flushComment() before the next
/// value. Only one comment may be pending at a time.
// NOTE(review): PendingComment is used like a StringRef elsewhere in this file
// (find/take_front/drop_front), so the caller's buffer presumably has to stay
// alive until the comment is flushed — confirm against the declaration.
void OStream::comment(llvm::StringRef Comment) {
  assert(PendingComment.empty() && "Only one comment per value!");
  PendingComment = Comment;
}


/// Writes the pending comment, if any, as a /* ... */ block and clears it.
///
/// Padding spaces inside the delimiters are added only when indenting. Any
/// "*/" inside the text is rewritten to "* /" so the comment cannot end
/// early. Afterwards a single space follows when the comment is attached to
/// an attribute value (and indenting is on); otherwise newline() is called.
void OStream::flushComment() {
  if (PendingComment.empty())
    return;

  OS << (IndentSize ? "/* " : "/*");
  // Be sure not to accidentally emit "*/". Transform to "* /".
  for (;;) {
    const auto Pos = PendingComment.find("*/");
    if (Pos == StringRef::npos)
      break;
    OS << PendingComment.take_front(Pos) << "* /";
    PendingComment = PendingComment.drop_front(Pos + 2);
  }
  // Whatever remains contains no terminator and can be written verbatim.
  OS << PendingComment;
  PendingComment = "";
  OS << (IndentSize ? " */" : "*/");

  // Comments are on their own line unless attached to an attribute value.
  const bool AttachedToAttribute =
      Stack.size() > 1 && Stack.back().Ctx == Singleton;
  if (!AttachedToAttribute) {
    newline();
    return;
  }
  if (IndentSize)
    OS << ' ';
}


/// When indentation is enabled (IndentSize != 0), writes a line break followed
/// by the current indentation. Does nothing otherwise.
void llvm::json::OStream::newline() {
  if (!IndentSize)
    return;
  OS.write('\n');
  OS.indent(Indent);
}


/// Opens an array: performs the usual value preamble, writes '[', pushes an
/// Array context onto the stack and increases the indentation by one level.
void llvm::json::OStream::arrayBegin() {
  valueBegin();
  OS << '[';
  Indent += IndentSize;
  Stack.emplace_back();
  Stack.back().Ctx = Array;
}


/// Closes the current array: restores the indentation, puts ']' on its own
/// line if the array has elements, and pops the Array context.
void llvm::json::OStream::arrayEnd() {
  assert(Stack.back().Ctx == Array);
  Indent -= IndentSize;
  const bool HadElements = Stack.back().HasValue;
  if (HadElements)
    newline();
  OS << ']';
  assert(PendingComment.empty());
  Stack.pop_back();
  assert(!Stack.empty());
}


/// Opens an object: performs the usual value preamble, writes '{', pushes an
/// Object context onto the stack and increases the indentation by one level.
void llvm::json::OStream::objectBegin() {
  valueBegin();
  OS << '{';
  Indent += IndentSize;
  Stack.emplace_back();
  Stack.back().Ctx = Object;
}


/// Closes the current object: restores the indentation, puts '}' on its own
/// line if the object has attributes, and pops the Object context.
void llvm::json::OStream::objectEnd() {
  assert(Stack.back().Ctx == Object);
  Indent -= IndentSize;
  const bool HadAttributes = Stack.back().HasValue;
  if (HadAttributes)
    newline();
  OS << '}';
  assert(PendingComment.empty());
  Stack.pop_back();
  assert(!Stack.empty());
}


/// Starts an attribute inside the current object: writes the separating comma
/// if needed, a new line, any pending comment, the quoted key and ':' (plus a
/// space when indenting). A Singleton context is pushed for the value.
///
/// A key that is not valid UTF-8 trips an assertion; in builds without
/// assertions it is repaired with fixUTF8() before being written.
void llvm::json::OStream::attributeBegin(llvm::StringRef Key) {
  assert(Stack.back().Ctx == Object);
  if (Stack.back().HasValue)
    OS << ',';
  newline();
  flushComment();
  Stack.back().HasValue = true;

  // The attribute's value lives in its own single-value context.
  Stack.emplace_back();
  Stack.back().Ctx = Singleton;

  if (LLVM_UNLIKELY(!isUTF8(Key))) {
    assert(false && "Invalid UTF-8 in attribute key");
    quote(OS, fixUTF8(Key));
  } else {
    quote(OS, Key);
  }

  OS.write(':');
  if (IndentSize)
    OS.write(' ');
}


/// Finishes the current attribute by popping its Singleton context. The
/// attribute must have received a value, no comment may be pending, and the
/// enclosing context must be an object.
void llvm::json::OStream::attributeEnd() {
#ifndef NDEBUG
  const auto &Top = Stack.back();
  assert(Top.Ctx == Singleton);
  assert(Top.HasValue && "Attribute must have a value");
#endif
  assert(PendingComment.empty());
  Stack.pop_back();
  assert(Stack.back().Ctx == Object);
}


/// Starts an externally-serialized value: performs the usual value preamble,
/// pushes a RawValue context, and returns the underlying stream for the caller
/// to write to.
raw_ostream &llvm::json::OStream::rawValueBegin() {
  valueBegin();
  auto &Frame = Stack.emplace_back();
  Frame.Ctx = RawValue;
  return OS;
}


/// Finishes an externally-serialized value by popping the RawValue context
/// that rawValueBegin() pushed.
void llvm::json::OStream::rawValueEnd() {
  // The innermost context must be the one opened by rawValueBegin().
  assert(Stack.back().Ctx == RawValue);
  Stack.pop_back();
}


} // namespace json

} // namespace llvm


/// formatv() support for json::Value: prints \p E to \p OS.
///
/// \p Options, when non-empty, must be a decimal integer giving the indent
/// size; an empty string means an indent of 0. Any other option string is
/// treated as unreachable.
void llvm::format_provider<llvm::json::Value>::format(
    const llvm::json::Value &E, raw_ostream &OS, StringRef Options) {
  unsigned IndentAmount = 0;
  // getAsInteger() returns true on failure.
  const bool BadOptions =
      !Options.empty() && Options.getAsInteger(/*Radix=*/10, IndentAmount);
  if (BadOptions)
    llvm_unreachable("json::Value format options should be an integer");
  json::OStream Writer(OS, IndentAmount);
  Writer.value(E);
}


assert
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")

C
static GCRegistry::Add< ShadowStackGC > C("shadow-stack", "Very portable GC for uncooperative code generators")

A
static GCRegistry::Add< ErlangGC > A("erlang", "erlang-compatible garbage collector")

E
static GCRegistry::Add< CoreCLRGC > E("coreclr", "CoreCLR-compatible GC")

LLVM_UNLIKELY
#define LLVM_UNLIKELY(EXPR)
Definition Compiler.h:336

LLVM_LIKELY
#define LLVM_LIKELY(EXPR)
Definition Compiler.h:335

ConvertUTF.h

Format.h

OffsetKind::Value
@ Value
Definition InstCombineCompares.cpp:5867

JSON.h
This file supports working with JSON data.

Options
static LVOptions Options
Definition LVOptions.cpp:25

I
#define I(x, y, z)
Definition MD5.cpp:58

NativeFormatting.h

P
#define P(N)

STLExtras.h
This file contains some templates that are useful if you are working with the STL at all.

StringExtras.h
This file contains some functions that are useful when dealing with strings.

X
static TableGen::Emitter::OptClass< SkeletonEmitter > X("gen-skeleton-class", "Generate example skeleton class")

peek
static bool peek(struct InternalInstruction *insn, uint8_t &byte)
Definition X86Disassembler.cpp:191

RHS
Value * RHS
Definition X86PartialReduction.cpp:74

LHS
Value * LHS
Definition X86PartialReduction.cpp:73

llvm::ArrayRef
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition ArrayRef.h:41

llvm::Error
Lightweight error class with error context and mandatory checking.
Definition Error.h:159

llvm::Expected
Tagged union holding either a T or a Error.
Definition Error.h:485

llvm::StringLiteral
A wrapper around a string literal that serves as a proxy for constructing global tables of StringRefs...
Definition StringRef.h:862

llvm::StringRef
StringRef - Represent a constant reference to a string, i.e.
Definition StringRef.h:55

llvm::StringRef::size
constexpr size_t size() const
size - Get the string size.
Definition StringRef.h:154

llvm::StringRef::data
constexpr const char * data() const
data - Get a pointer to the start of the string (which may not be null terminated).
Definition StringRef.h:148

llvm::StringRef::take_front
StringRef take_front(size_t N=1) const
Return a StringRef equal to 'this' but with only the first N elements remaining.
Definition StringRef.h:590

llvm::StringRef::npos
static constexpr size_t npos
Definition StringRef.h:57

llvm::Type
The instances of the Type class are immutable: once they are created, they are never changed.
Definition Type.h:45

llvm::Type::Type
Type(LLVMContext &C, TypeID tid)
Definition Type.h:93

llvm::Value
LLVM Value Representation.
Definition Value.h:75

llvm::json::Array
An Array is a JSON array, which contains heterogeneous JSON values.
Definition JSON.h:166

llvm::json::Array::emplace_back
void emplace_back(Args &&...A)
Definition JSON.h:564

llvm::json::Array::Array
Array()=default

llvm::json::Array::back
Value & back()
Definition JSON.h:547

llvm::json::OStream
json::OStream allows writing well-formed JSON without materializing all structures as json::Value ahe...
Definition JSON.h:998

llvm::json::OStream::object
void object(Block Contents)
Emit an object whose elements are emitted in the provided Block.
Definition JSON.h:1028

llvm::json::OStream::rawValue
void rawValue(llvm::function_ref< void(raw_ostream &)> Contents)
Emit an externally-serialized value.
Definition JSON.h:1036

llvm::json::OStream::attributeBegin
LLVM_ABI void attributeBegin(llvm::StringRef Key)
Definition JSON.cpp:871

llvm::json::OStream::attribute
void attribute(llvm::StringRef Key, const Value &Contents)
Emit an attribute whose value is self-contained (number, vector<int> etc).
Definition JSON.h:1053

llvm::json::OStream::arrayBegin
LLVM_ABI void arrayBegin()
Definition JSON.cpp:833

llvm::json::OStream::objectBegin
LLVM_ABI void objectBegin()
Definition JSON.cpp:852

llvm::json::OStream::rawValueBegin
LLVM_ABI raw_ostream & rawValueBegin()
Definition JSON.cpp:899

llvm::json::OStream::comment
LLVM_ABI void comment(llvm::StringRef)
Emit a JavaScript comment associated with the next printed value.
Definition JSON.cpp:796

llvm::json::OStream::array
void array(Block Contents)
Emit an array whose elements are emitted in the provided Block.
Definition JSON.h:1022

llvm::json::OStream::arrayEnd
LLVM_ABI void arrayEnd()
Definition JSON.cpp:841

llvm::json::OStream::attributeEnd
LLVM_ABI void attributeEnd()
Definition JSON.cpp:891

llvm::json::OStream::value
LLVM_ABI void value(const Value &V)
Emit a self-contained value (number, string, vector<string> etc).
Definition JSON.cpp:747

llvm::json::OStream::rawValueEnd
LLVM_ABI void rawValueEnd()
Definition JSON.cpp:906

llvm::json::OStream::objectEnd
LLVM_ABI void objectEnd()
Definition JSON.cpp:860

llvm::json::ObjectKey
ObjectKey is used to capture keys in Object.
Definition JSON.h:588

llvm::json::Object
An Object is a JSON object, which maps strings to heterogeneous JSON values.
Definition JSON.h:98

llvm::json::Object::end
iterator end()
Definition JSON.h:117

llvm::json::Object::getBoolean
LLVM_ABI std::optional< bool > getBoolean(StringRef K) const
Definition JSON.cpp:47

llvm::json::Object::operator[]
LLVM_ABI Value & operator[](const ObjectKey &K)
Definition JSON.cpp:24

llvm::json::Object::getNumber
LLVM_ABI std::optional< double > getNumber(StringRef K) const
Definition JSON.cpp:52

llvm::json::Object::getObject
LLVM_ABI const json::Object * getObject(StringRef K) const
Definition JSON.cpp:67

llvm::json::Object::getString
LLVM_ABI std::optional< llvm::StringRef > getString(StringRef K) const
Definition JSON.cpp:62

llvm::json::Object::value_type
Storage::value_type value_type
Definition JSON.h:105

llvm::json::Object::get
LLVM_ABI Value * get(StringRef K)
Definition JSON.cpp:30

llvm::json::Object::getInteger
LLVM_ABI std::optional< int64_t > getInteger(StringRef K) const
Definition JSON.cpp:57

llvm::json::Object::getNull
LLVM_ABI std::optional< std::nullptr_t > getNull(StringRef K) const
Definition JSON.cpp:42

llvm::json::Object::try_emplace
std::pair< iterator, bool > try_emplace(const ObjectKey &K, Ts &&... Args)
Definition JSON.h:126

llvm::json::Object::find
iterator find(StringRef K)
Definition JSON.h:136

llvm::json::Object::getArray
LLVM_ABI const json::Array * getArray(StringRef K) const
Definition JSON.cpp:77

llvm::json::Object::Object
Object()=default

llvm::json::ParseError::ID
static LLVM_ABI char ID
Definition JSON.h:919

llvm::json::Path::Root
The root is the trivial Path to the root value.
Definition JSON.h:713

llvm::json::Path::Root::printErrorContext
LLVM_ABI void printErrorContext(const Value &, llvm::raw_ostream &) const
Print the root value with the error shown inline as a comment.
Definition JSON.cpp:300

llvm::json::Path::Root::getError
LLVM_ABI Error getError() const
Returns the last error reported, or else a generic error.
Definition JSON.cpp:219

llvm::json::Path::report
LLVM_ABI void report(llvm::StringLiteral Message)
Records that the value at the current path is invalid.
Definition JSON.cpp:204

llvm::json::Path::Path
Path(Root &R)
The root may be treated as a Path.
Definition JSON.h:676

llvm::json::Value
A Value is a JSON value of unknown type.
Definition JSON.h:290

llvm::json::Value::Object
friend class Object
Definition JSON.h:493

llvm::json::Value::print
LLVM_ABI void print(llvm::raw_ostream &OS) const
Definition JSON.cpp:176

llvm::json::Value::Value
Value(const Value &M)
Definition JSON.h:304

llvm::json::Value::Boolean
@ Boolean
Definition JSON.h:294

llvm::json::Value::String
@ String
Definition JSON.h:298

llvm::json::Value::Number
@ Number
Number values can store both int64s and doubles at full precision, depending on what they were constructed/parsed from.
Definition JSON.h:297

llvm::json::Value::Null
@ Null
Definition JSON.h:293

llvm::json::Value::Array
friend class Array
Definition JSON.h:492

llvm::raw_ostream
This class implements an extremely fast bulk output stream that can only output to a stream.
Definition raw_ostream.h:53

llvm::raw_string_ostream
A raw_ostream that writes to an std::string.
Definition raw_ostream.h:662

uint32_t

uint8_t

llvm_unreachable
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
Definition ErrorHandling.h:164

Error.h

llvm::CallingConv::C
@ C
The default llvm calling convention, compatible with C.
Definition CallingConv.h:34

llvm::M68k::MemAddrModeKind::K
@ K
Definition M68kBaseInfo.h:68

llvm::RISCVFenceField::O
@ O
Definition RISCVBaseInfo.h:399

llvm::ifs::IFSSymbolType::Object
@ Object
Definition IFSStub.h:29

llvm::json
Definition TensorSpec.h:23

llvm::json::abbreviateChildren
static void abbreviateChildren(const Value &V, OStream &JOS)
Definition JSON.cpp:278

llvm::json::parse
LLVM_ABI llvm::Expected< Value > parse(llvm::StringRef JSON)
Parses the provided JSON source, or returns a ParseError.
Definition JSON.cpp:675

llvm::json::abbreviate
static void abbreviate(const Value &V, OStream &JOS)
Definition JSON.cpp:252

llvm::json::operator==
LLVM_ABI bool operator==(const Object &LHS, const Object &RHS)
Definition JSON.cpp:87

llvm::json::isUTF8
LLVM_ABI bool isUTF8(llvm::StringRef S, size_t *ErrOffset=nullptr)
Returns true if S is valid UTF-8, which is required for use as JSON.
Definition JSON.cpp:686

llvm::json::sortedElements
LLVM_ABI std::vector< const Object::value_type * > sortedElements(const Object &O)
Definition JSON.cpp:238

llvm::json::quote
static void quote(llvm::raw_ostream &OS, llvm::StringRef S)
Definition JSON.cpp:717

llvm::json::fixUTF8
LLVM_ABI std::string fixUTF8(llvm::StringRef S)
Replaces invalid UTF-8 sequences in S with the replacement character (U+FFFD).
Definition JSON.cpp:700

llvm::json::encodeUtf8
static void encodeUtf8(uint32_t Rune, std::string &Out)
Definition JSON.cpp:573

llvm::logicalview::LVSortMode::Line
@ Line
Definition LVSort.h:27

llvm::memprof::Meta::Start
@ Start
Definition MemProf.h:69

llvm::msgpack::Type::Array
@ Array
Definition MsgPackReader.h:62

llvm::pdb::PDB_MemoryType::Stack
@ Stack
Definition PDBTypes.h:328

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition AddressRanges.h:18

llvm::Value
FunctionAddr VTableAddr Value
Definition InstrProf.h:137

llvm::ConvertUTF8toUTF32
LLVM_ABI ConversionResult ConvertUTF8toUTF32(const UTF8 **sourceStart, const UTF8 *sourceEnd, UTF32 **targetStart, UTF32 *targetEnd, ConversionFlags flags)
Convert a partial UTF8 sequence to UTF32.
Definition ConvertUTF.cpp:736

llvm::inconvertibleErrorCode
LLVM_ABI std::error_code inconvertibleErrorCode()
The value returned by this function can be returned from convertToErrorCode for Error values where no sensible translation to std::error_code exists.
Definition Error.cpp:98

llvm::createStringError
Error createStringError(std::error_code EC, char const *Fmt, const Ts &... Vals)
Create formatted StringError object.
Definition Error.h:1305

llvm::lenientConversion
@ lenientConversion
Definition ConvertUTF.h:158

llvm::strictConversion
@ strictConversion
Definition ConvertUTF.h:157

llvm::HexPrintStyle::Lower
@ Lower
Definition NativeFormatting.h:23

llvm::reverse
auto reverse(ContainerTy &&C)
Definition STLExtras.h:420

llvm::sort
void sort(IteratorTy Start, IteratorTy End)
Definition STLExtras.h:1652

llvm::Count
FunctionAddr VTableAddr Count
Definition InstrProf.h:139

llvm::format
format_object< Ts... > format(const char *Fmt, const Ts &... Vals)
These are helper functions used to produce formatted output.
Definition Format.h:126

llvm::Key
LLVM_ATTRIBUTE_VISIBILITY_DEFAULT AnalysisKey InnerAnalysisManagerProxy< AnalysisManagerT, IRUnitT, ExtraArgTs... >::Key
Definition PassManager.h:668

llvm::IRMemLocation::First
@ First
Helpers to iterate all locations in the MemoryEffectsBase class.
Definition ModRef.h:71

llvm::Data
FunctionAddr VTableAddr uintptr_t uintptr_t Data
Definition InstrProf.h:189

llvm::write_hex
LLVM_ABI void write_hex(raw_ostream &S, uint64_t N, HexPrintStyle Style, std::optional< size_t > Width=std::nullopt)
Definition NativeFormatting.cpp:134

llvm::ConvertUTF32toUTF8
LLVM_ABI ConversionResult ConvertUTF32toUTF8(const UTF32 **sourceStart, const UTF32 *sourceEnd, UTF8 **targetStart, UTF8 *targetEnd, ConversionFlags flags)
Definition ConvertUTF.cpp:333

llvm::isASCII
bool isASCII(char C)
Checks whether character C is valid ASCII (high bit is zero).
Definition StringExtras.h:125

llvm::isLegalUTF8String
LLVM_ABI Boolean isLegalUTF8String(const UTF8 **source, const UTF8 *sourceEnd)
Definition ConvertUTF.cpp:555

llvm::UTF8
unsigned char UTF8
Definition ConvertUTF.h:131

llvm::UTF32
unsigned int UTF32
Definition ConvertUTF.h:129

llvm::Invalid
@ Invalid
Definition PGOCtxProfWriter.h:24

raw_ostream.h

llvm::format_provider
Definition FormatVariadicDetails.h:20