-
Notifications
You must be signed in to change notification settings - Fork 74
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
feat(clp-s): Add boilerplate for SQL parsing. (#504)
Co-authored-by: Lin Zhihao <[email protected]>
- Loading branch information
1 parent
09bab5a
commit 0c00a94
Showing
11 changed files
with
193 additions
and
30 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,4 +1,5 @@ | ||
add_subdirectory(search/kql) | ||
add_subdirectory(search/sql) | ||
|
||
set( | ||
CLP_SOURCES | ||
|
36 changes: 36 additions & 0 deletions
36
components/core/src/clp_s/search/antlr_common/ErrorListener.hpp
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,36 @@ | ||
#ifndef CLP_S_SEARCH_ANTLRCOMMON_ERRORLISTENER_HPP | ||
#define CLP_S_SEARCH_ANTLRCOMMON_ERRORLISTENER_HPP | ||
|
||
#include <cstddef> | ||
#include <exception> | ||
#include <string> | ||
#include <string_view> | ||
|
||
#include <antlr4-runtime.h> | ||
|
||
namespace clp_s::search::antlr_common { | ||
class ErrorListener : public antlr4::BaseErrorListener { | ||
public: | ||
auto syntaxError( | ||
[[maybe_unused]] antlr4::Recognizer* recognizer, | ||
[[maybe_unused]] antlr4::Token* offending_symbol, | ||
[[maybe_unused]] size_t line, | ||
[[maybe_unused]] size_t char_position_in_line, | ||
std::string const& msg, | ||
[[maybe_unused]] std::exception_ptr e | ||
) -> void override { | ||
m_error = true; | ||
m_error_message = msg; | ||
} | ||
|
||
[[nodiscard]] auto error() const -> bool { return m_error; } | ||
|
||
[[nodiscard]] auto message() const -> std::string_view { return m_error_message; } | ||
|
||
private: | ||
bool m_error{false}; | ||
std::string m_error_message; | ||
}; | ||
} // namespace clp_s::search::antlr_common | ||
|
||
#endif // CLP_S_SEARCH_ANTLRCOMMON_ERRORLISTENER_HPP |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,29 @@ | ||
# Generate the C++ lexer, parser, and visitor from the SQL grammar (generated code is placed in the
# package given by PACKAGE).
ANTLR_TARGET(SqlParser Sql.g4 LEXER PARSER VISITOR PACKAGE sql)

# Sources for the SQL front end: shared search AST headers, the ANTLR-generated files, and the
# hand-written parser entry point.
set(
        SQL_SOURCES
        ../../Utils.hpp
        ../antlr_common/ErrorListener.hpp
        ../AndExpr.hpp
        ../BooleanLiteral.hpp
        ../ColumnDescriptor.hpp
        ../DateLiteral.hpp
        ../EmptyExpr.hpp
        ../Expression.hpp
        ../FilterExpr.hpp
        ../Integral.hpp
        ../NullLiteral.hpp
        ../OrExpr.hpp
        ../StringLiteral.hpp
        ${ANTLR_SqlParser_CXX_OUTPUTS}
        sql.cpp
        sql.hpp
)

add_library(sql ${SQL_SOURCES})
target_compile_features(sql PRIVATE cxx_std_20)
# The generated headers live in the ANTLR output directory.
target_include_directories(sql PRIVATE ${ANTLR_SqlParser_OUTPUT_DIR})
target_link_libraries(sql PRIVATE antlr4_static Boost::filesystem)
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,6 @@ | ||
// Boilerplate for work-in-progress SQL grammar.
grammar Sql;

// Entry rule. The stub grammar accepts only empty input (whitespace is skipped by the lexer).
start: EOF ;

// Skip whitespace. The `+` consumes each run of whitespace as a single skipped token instead of
// producing one token per character.
SPACE: [ \t\r\n]+ -> skip ;
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,63 @@ | ||
#include <any> | ||
#include <iostream> | ||
#include <memory> | ||
|
||
#include <antlr4-runtime.h> | ||
#include <spdlog/spdlog.h> | ||
|
||
#include "../antlr_common/ErrorListener.hpp" | ||
#include "../EmptyExpr.hpp" | ||
#include "../Expression.hpp" | ||
#include "SqlBaseVisitor.h" | ||
#include "SqlLexer.h" | ||
#include "SqlParser.h" | ||
|
||
using antlr4::ANTLRInputStream; | ||
using antlr4::CommonTokenStream; | ||
using clp_s::search::antlr_common::ErrorListener; | ||
using sql::SqlBaseVisitor; | ||
using sql::SqlLexer; | ||
using sql::SqlParser; | ||
|
||
namespace clp_s::search::sql { | ||
namespace { | ||
class ParseTreeVisitor : public SqlBaseVisitor { | ||
public: | ||
[[nodiscard]] auto visitStart([[maybe_unused]] SqlParser::StartContext* ctx) | ||
-> std::any override { | ||
return EmptyExpr::create(); | ||
} | ||
}; | ||
} // namespace | ||
|
||
// Parses the SQL expression in `in` and converts it into a search AST. Returns nullptr, after
// logging the reason, if lexing, parsing, or AST construction fails.
auto parse_sql_expression(std::istream& in) -> std::shared_ptr<Expression> {
    ErrorListener lexer_error_listener;
    ErrorListener parser_error_listener;

    // Replace ANTLR's default listeners with ours so that errors are captured for inspection below.
    ANTLRInputStream input{in};
    SqlLexer lexer{&input};
    lexer.removeErrorListeners();
    lexer.addErrorListener(&lexer_error_listener);
    CommonTokenStream tokens{&lexer};
    SqlParser parser(&tokens);
    parser.removeErrorListeners();
    parser.addErrorListener(&parser_error_listener);
    SqlParser::StartContext* tree{parser.start()};

    if (lexer_error_listener.error()) {
        SPDLOG_ERROR("Lexer error: {}", lexer_error_listener.message());
        return nullptr;
    }
    if (parser_error_listener.error()) {
        SPDLOG_ERROR("Parser error: {}", parser_error_listener.message());
        return nullptr;
    }

    ParseTreeVisitor visitor;
    try {
        return std::any_cast<std::shared_ptr<Expression>>(visitor.visitStart(tree));
    } catch (std::exception const& e) {
        // Report the failure like the lexer/parser paths do instead of swallowing it silently.
        SPDLOG_ERROR("Failed to build search AST from SQL parse tree: {}", e.what());
        return nullptr;
    }
}
} // namespace clp_s::search::sql |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,18 @@ | ||
#ifndef CLP_S_SEARCH_SQL_SQL_HPP | ||
#define CLP_S_SEARCH_SQL_SQL_HPP | ||
|
||
#include <istream> | ||
#include <memory> | ||
|
||
#include "../Expression.hpp" | ||
|
||
namespace clp_s::search::sql { | ||
/** | ||
* Parses an SQL expression from the given stream to generate a search AST. Lexer and parser errors | ||
* are reported through the logger rather than returned to the caller. | ||
* @param in Input stream containing an SQL expression followed by EOF | ||
* @return a search AST on success, nullptr otherwise | ||
*/ | ||
[[nodiscard]] auto parse_sql_expression(std::istream& in) -> std::shared_ptr<Expression>; | ||
} // namespace clp_s::search::sql | ||
|
||
#endif // CLP_S_SEARCH_SQL_SQL_HPP |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,23 @@ | ||
#include <memory> | ||
#include <sstream> | ||
|
||
#include <Catch2/single_include/catch2/catch.hpp> | ||
|
||
#include "../src/clp_s/search/EmptyExpr.hpp" | ||
#include "../src/clp_s/search/sql/sql.hpp" | ||
#include "LogSuppressor.hpp" | ||
|
||
using clp_s::search::EmptyExpr; | ||
using clp_s::search::sql::parse_sql_expression; | ||
using std::stringstream; | ||
|
||
// Exercises the stub SQL parser: empty input must produce an empty expression.
TEST_CASE("Test parsing SQL", "[SQL]") {
    // Keep parser diagnostics out of the test output
    LogSuppressor const suppressor;

    SECTION("Stub accepts empty string") {
        stringstream empty_input{""};
        auto const ast = parse_sql_expression(empty_input);
        auto const empty_expr = std::dynamic_pointer_cast<EmptyExpr>(ast);
        REQUIRE((nullptr != empty_expr));
    }
}