mirror of
https://gitlab.com/manzerbredes/pgnp.git
synced 2025-04-06 10:06:25 +02:00
Improve location pointer type flexibility
This commit is contained in:
parent
f144f14d9c
commit
3f9ab56bd6
6 changed files with 25 additions and 23 deletions
|
@ -9,7 +9,7 @@ PGN specification can be found [here](https://www.chessclub.com/help/PGN-spec).
|
||||||
# Features
|
# Features
|
||||||
- Basic PGN parsing (tags, move, comments, variations, NAG, etc.)
|
- Basic PGN parsing (tags, move, comments, variations, NAG, etc.)
|
||||||
- Merged PGN files parsing (several games in one file)
|
- Merged PGN files parsing (several games in one file)
|
||||||
- Handle very large file (max is 2^(sizeof(unsigned long long)) bytes)
|
- Handle very large file (max is 2^(sizeof(unsigned long long)*8) bytes)
|
||||||
- Efficiency
|
- Efficiency
|
||||||
|
|
||||||
# How to use it ?
|
# How to use it ?
|
||||||
|
|
|
@ -23,7 +23,7 @@ void LargeFileStream::ReadNextChunk() {
|
||||||
last_read_size = file.gcount();
|
last_read_size = file.gcount();
|
||||||
}
|
}
|
||||||
|
|
||||||
char LargeFileStream::operator[](ull loc) {
|
char LargeFileStream::operator[](loctype loc) {
|
||||||
// Perform various checks
|
// Perform various checks
|
||||||
if (eof) {
|
if (eof) {
|
||||||
throw ReadToFar();
|
throw ReadToFar();
|
||||||
|
@ -42,11 +42,11 @@ char LargeFileStream::operator[](ull loc) {
|
||||||
}
|
}
|
||||||
|
|
||||||
// Goto the right memory chuck
|
// Goto the right memory chuck
|
||||||
ull loc_chunk_count = loc / BUFFER_SIZE;
|
loctype loc_chunk_count = loc / BUFFER_SIZE;
|
||||||
while (chuck_count < loc_chunk_count) {
|
while (chuck_count < loc_chunk_count) {
|
||||||
ReadNextChunk();
|
ReadNextChunk();
|
||||||
}
|
}
|
||||||
ull offset = loc - (loc_chunk_count * BUFFER_SIZE);
|
loctype offset = loc - (loc_chunk_count * BUFFER_SIZE);
|
||||||
|
|
||||||
// Ensure for EOF
|
// Ensure for EOF
|
||||||
if (!file && offset >= last_read_size) {
|
if (!file && offset >= last_read_size) {
|
||||||
|
|
|
@ -16,11 +16,11 @@ class LargeFileStream {
|
||||||
/// @brief In memory buffer
|
/// @brief In memory buffer
|
||||||
char buffer[BUFFER_SIZE];
|
char buffer[BUFFER_SIZE];
|
||||||
/// @brief Number of chuck read minus 1
|
/// @brief Number of chuck read minus 1
|
||||||
ull chuck_count;
|
loctype chuck_count;
|
||||||
/// @brief Number of byte read during the last file access
|
/// @brief Number of byte read during the last file access
|
||||||
ull last_read_size;
|
loctype last_read_size;
|
||||||
/// @brief Keep track of the file offset (to prevent backward read)
|
/// @brief Keep track of the file offset (to prevent backward read)
|
||||||
ull last_loc;
|
loctype last_loc;
|
||||||
/// @brief Use a string as file content
|
/// @brief Use a string as file content
|
||||||
std::string content;
|
std::string content;
|
||||||
/// @brief Use to shortcut some methods
|
/// @brief Use to shortcut some methods
|
||||||
|
@ -37,7 +37,7 @@ public:
|
||||||
/// @brief Emulate file access with a string
|
/// @brief Emulate file access with a string
|
||||||
void FromString(std::string content);
|
void FromString(std::string content);
|
||||||
/// @brief Allow array like access to the file
|
/// @brief Allow array like access to the file
|
||||||
char operator[](ull loc);
|
char operator[](loctype loc);
|
||||||
/// @brief Check if we reach the EOF
|
/// @brief Check if we reach the EOF
|
||||||
bool IsEOF();
|
bool IsEOF();
|
||||||
|
|
||||||
|
|
16
src/PGN.cpp
16
src/PGN.cpp
|
@ -45,7 +45,7 @@ void PGN::ParseNextGame() {
|
||||||
if (IS_EOF) {
|
if (IS_EOF) {
|
||||||
throw NoGameFound();
|
throw NoGameFound();
|
||||||
}
|
}
|
||||||
ull loc = GotoNextToken(LastGameEndLoc);
|
loctype loc = GotoNextToken(LastGameEndLoc);
|
||||||
if (IS_EOF) {
|
if (IS_EOF) {
|
||||||
throw NoGameFound();
|
throw NoGameFound();
|
||||||
}
|
}
|
||||||
|
@ -103,7 +103,7 @@ bool PGN::HasTag(std::string key) {
|
||||||
return (std::find(tags.begin(), tags.end(), key) != tags.end());
|
return (std::find(tags.begin(), tags.end(), key) != tags.end());
|
||||||
}
|
}
|
||||||
|
|
||||||
ull PGN::ParseComment(ull loc, HalfMove *hm) {
|
loctype PGN::ParseComment(loctype loc, HalfMove *hm) {
|
||||||
// Goto next char
|
// Goto next char
|
||||||
loc = GotoNextToken(loc);
|
loc = GotoNextToken(loc);
|
||||||
EOF_CHECK(loc);
|
EOF_CHECK(loc);
|
||||||
|
@ -131,7 +131,7 @@ ull PGN::ParseComment(ull loc, HalfMove *hm) {
|
||||||
return (loc);
|
return (loc);
|
||||||
}
|
}
|
||||||
|
|
||||||
ull PGN::ParseHalfMove(ull loc, HalfMove *hm) {
|
loctype PGN::ParseHalfMove(loctype loc, HalfMove *hm) {
|
||||||
// Goto next char
|
// Goto next char
|
||||||
loc = GotoNextToken(loc);
|
loc = GotoNextToken(loc);
|
||||||
EOF_CHECK(loc);
|
EOF_CHECK(loc);
|
||||||
|
@ -249,10 +249,10 @@ ull PGN::ParseHalfMove(ull loc, HalfMove *hm) {
|
||||||
return (loc);
|
return (loc);
|
||||||
}
|
}
|
||||||
|
|
||||||
ull PGN::ParseNextTag(ull start_loc) {
|
loctype PGN::ParseNextTag(loctype start_loc) {
|
||||||
// Parse key
|
// Parse key
|
||||||
std::string key;
|
std::string key;
|
||||||
ull keyloc = start_loc + 1;
|
loctype keyloc = start_loc + 1;
|
||||||
EOF_CHECK(keyloc);
|
EOF_CHECK(keyloc);
|
||||||
char c = pgn_content[keyloc];
|
char c = pgn_content[keyloc];
|
||||||
while (!IS_BLANK(c)) {
|
while (!IS_BLANK(c)) {
|
||||||
|
@ -264,7 +264,7 @@ ull PGN::ParseNextTag(ull start_loc) {
|
||||||
|
|
||||||
// Parse value
|
// Parse value
|
||||||
std::string value;
|
std::string value;
|
||||||
ull valueloc = GotoNextToken(keyloc) + 1;
|
loctype valueloc = GotoNextToken(keyloc) + 1;
|
||||||
EOF_CHECK(keyloc);
|
EOF_CHECK(keyloc);
|
||||||
c = pgn_content[valueloc];
|
c = pgn_content[valueloc];
|
||||||
while (c != '"' or IS_EOF) {
|
while (c != '"' or IS_EOF) {
|
||||||
|
@ -312,7 +312,7 @@ std::string PGN::Dump() {
|
||||||
return (ss.str());
|
return (ss.str());
|
||||||
}
|
}
|
||||||
|
|
||||||
ull PGN::GotoNextToken(ull loc) {
|
loctype PGN::GotoNextToken(loctype loc) {
|
||||||
char c = pgn_content[loc];
|
char c = pgn_content[loc];
|
||||||
while (IS_BLANK(c)) {
|
while (IS_BLANK(c)) {
|
||||||
loc++;
|
loc++;
|
||||||
|
@ -331,7 +331,7 @@ ull PGN::GotoNextToken(ull loc) {
|
||||||
return (loc);
|
return (loc);
|
||||||
}
|
}
|
||||||
|
|
||||||
ull PGN::GotoEOL(ull loc) {
|
loctype PGN::GotoEOL(loctype loc) {
|
||||||
char c = pgn_content[loc];
|
char c = pgn_content[loc];
|
||||||
while (true) {
|
while (true) {
|
||||||
loc++;
|
loc++;
|
||||||
|
|
14
src/PGN.hpp
14
src/PGN.hpp
|
@ -24,7 +24,7 @@ private:
|
||||||
LargeFileStream pgn_content;
|
LargeFileStream pgn_content;
|
||||||
/// @brief Contains the location of the end of the last parsed game (1 PGN
|
/// @brief Contains the location of the end of the last parsed game (1 PGN
|
||||||
/// file may have multiple games)
|
/// file may have multiple games)
|
||||||
ull LastGameEndLoc;
|
loctype LastGameEndLoc;
|
||||||
|
|
||||||
public:
|
public:
|
||||||
PGN();
|
PGN();
|
||||||
|
@ -55,16 +55,16 @@ public:
|
||||||
private:
|
private:
|
||||||
/// @brief Populate @a tags with by parsing the one starting at location in
|
/// @brief Populate @a tags with by parsing the one starting at location in
|
||||||
/// argument
|
/// argument
|
||||||
ull ParseNextTag(ull);
|
loctype ParseNextTag(loctype);
|
||||||
/// @brief Parse a HalfMove at a specific location into @a pgn_content
|
/// @brief Parse a HalfMove at a specific location into @a pgn_content
|
||||||
ull ParseHalfMove(ull, HalfMove *);
|
loctype ParseHalfMove(loctype, HalfMove *);
|
||||||
/// @brief Parse a consecutive sequence of comment
|
/// @brief Parse a consecutive sequence of comment
|
||||||
ull ParseComment(ull, HalfMove *);
|
loctype ParseComment(loctype, HalfMove *);
|
||||||
/// @brief Get the next non-blank char location ignoring line comments ('%'
|
/// @brief Get the next non-blank char location ignoring line comments ('%'
|
||||||
/// and ';')
|
/// and ';')
|
||||||
ull GotoNextToken(ull);
|
loctype GotoNextToken(loctype);
|
||||||
/// @brief Goto the end of the current line
|
/// @brief Goto the end of the current line
|
||||||
ull GotoEOL(ull);
|
loctype GotoEOL(loctype);
|
||||||
};
|
};
|
||||||
|
|
||||||
struct UnexpectedEOF : public std::exception {
|
struct UnexpectedEOF : public std::exception {
|
||||||
|
@ -85,7 +85,7 @@ struct NoGameFound : public std::exception {
|
||||||
|
|
||||||
struct UnexpectedCharacter : public std::exception {
|
struct UnexpectedCharacter : public std::exception {
|
||||||
std::string msg;
|
std::string msg;
|
||||||
UnexpectedCharacter(char actual, char required, ull loc) {
|
UnexpectedCharacter(char actual, char required, loctype loc) {
|
||||||
std::stringstream ss;
|
std::stringstream ss;
|
||||||
ss << "Expected \'" << required << "\' at location " << loc
|
ss << "Expected \'" << required << "\' at location " << loc
|
||||||
<< " but read \'" << actual << "\'";
|
<< " but read \'" << actual << "\'";
|
||||||
|
|
|
@ -2,4 +2,6 @@
|
||||||
|
|
||||||
namespace pgnp {
|
namespace pgnp {
|
||||||
typedef unsigned long long ull;
|
typedef unsigned long long ull;
|
||||||
|
typedef unsigned int uint;
|
||||||
|
typedef ull loctype; // Choose location pointer type
|
||||||
}
|
}
|
Loading…
Add table
Reference in a new issue