Allow '/*...*/' and '//' comments, including multi-line comments, to appear anywhere in HLO text. Previously, only '/*...*/' comments were allowed, and only in certain locations in a serialized Literal. PiperOrigin-RevId: 208519204
132 lines
4.0 KiB
C++
132 lines
4.0 KiB
C++
/* Copyright 2017 The TensorFlow Authors. All Rights Reserved.
|
|
|
|
Licensed under the Apache License, Version 2.0 (the "License");
|
|
you may not use this file except in compliance with the License.
|
|
You may obtain a copy of the License at
|
|
|
|
http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
Unless required by applicable law or agreed to in writing, software
|
|
distributed under the License is distributed on an "AS IS" BASIS,
|
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
See the License for the specific language governing permissions and
|
|
limitations under the License.
|
|
==============================================================================*/
|
|
|
|
#ifndef TENSORFLOW_COMPILER_XLA_SERVICE_HLO_LEXER_H_
|
|
#define TENSORFLOW_COMPILER_XLA_SERVICE_HLO_LEXER_H_
|
|
|
|
#include <string>
|
|
|
|
#include "tensorflow/compiler/xla/service/hlo_token.h"
|
|
#include "tensorflow/compiler/xla/types.h"
|
|
#include "tensorflow/compiler/xla/xla_data.pb.h"
|
|
#include "tensorflow/core/lib/core/stringpiece.h"
|
|
#include "tensorflow/core/platform/logging.h"
|
|
#include "tensorflow/core/platform/regexp.h"
|
|
#include "tensorflow/core/platform/types.h"
|
|
|
|
namespace xla {
|
|
|
|
// Lexer for the HloModule::ToString() format text.
|
|
//
|
|
// This class is meant to be used by hlo_parser.cc. You shouldn't need to use
|
|
// it directly.
|
|
class HloLexer {
|
|
public:
|
|
explicit HloLexer(tensorflow::StringPiece buf) : buf_(buf) {
|
|
current_ptr_ = buf_.begin();
|
|
}
|
|
|
|
TokKind Lex() { return current_kind_ = LexToken(); }
|
|
|
|
TokKind GetKind() const { return current_kind_; }
|
|
string GetStrVal() const {
|
|
switch (GetKind()) {
|
|
case TokKind::kName:
|
|
case TokKind::kAttributeName:
|
|
case TokKind::kDimLabels:
|
|
case TokKind::kDxD:
|
|
case TokKind::kPad:
|
|
case TokKind::kString:
|
|
case TokKind::kIdent:
|
|
return str_val_;
|
|
default:
|
|
LOG(FATAL) << "This token does not have string value";
|
|
}
|
|
}
|
|
Shape GetShapeVal() const {
|
|
CHECK(GetKind() == TokKind::kShape);
|
|
return shape_val_;
|
|
}
|
|
tensorflow::int64 GetInt64Val() const {
|
|
CHECK(GetKind() == TokKind::kInt);
|
|
return int64_val_;
|
|
}
|
|
double GetDecimalVal() const {
|
|
CHECK(GetKind() == TokKind::kDecimal);
|
|
return decimal_val_;
|
|
}
|
|
|
|
typedef const char* LocTy;
|
|
|
|
// Returns the location of the current token.
|
|
LocTy GetLoc() const { return token_start_; }
|
|
|
|
// Returns the line and column of a location in the buffer.
|
|
std::pair<unsigned, unsigned> GetLineAndColumn(LocTy location) const;
|
|
|
|
// Returns the whole line given the location.
|
|
tensorflow::StringPiece GetLine(LocTy loc) const;
|
|
|
|
private:
|
|
// Returns the current character. If it's neither the end of input buffer nor
|
|
// an invalid character, moves the pointer forward.
|
|
int GetNextChar();
|
|
|
|
// Returns the current character.
|
|
int PeekCurrentChar() const;
|
|
|
|
// Creates StringPiece with the given begin and end. Exits if the begin > end,
|
|
// or it's out of the range of the current buffer.
|
|
tensorflow::StringPiece StringPieceFromPointers(const char* begin,
|
|
const char* end) const;
|
|
tensorflow::RegexpStringPiece RegexpStringPieceFromPointers(
|
|
const char* begin, const char* end) const;
|
|
|
|
// Returns true if the given ptr is dereferenceable within the range of the
|
|
// current buffer.
|
|
bool CanDereference(const char* ptr) const;
|
|
|
|
TokKind LexToken();
|
|
|
|
TokKind LexIdentifier();
|
|
TokKind LexPercent();
|
|
TokKind LexShape();
|
|
TokKind LexConstant();
|
|
TokKind LexNumberOrPattern();
|
|
TokKind LexString();
|
|
|
|
const tensorflow::StringPiece buf_;
|
|
const char* current_ptr_;
|
|
|
|
// Information about the current token.
|
|
const char* token_start_;
|
|
TokKind current_kind_;
|
|
string str_val_;
|
|
Shape shape_val_;
|
|
tensorflow::int64 int64_val_;
|
|
double decimal_val_;
|
|
|
|
struct LineNoCacheTy {
|
|
const char* last_query;
|
|
unsigned line_no_of_query;
|
|
};
|
|
// This caches the line number of the previous query.
|
|
mutable LineNoCacheTy line_no_cache_{nullptr, 0};
|
|
};
|
|
|
|
} // namespace xla
|
|
|
|
#endif // TENSORFLOW_COMPILER_XLA_SERVICE_HLO_LEXER_H_
|