MUSX Document Model
Loading...
Searching...
No Matches
EnigmaString.h
1/*
2 * Copyright (C) 2025, Robert Patterson
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a copy
5 * of this software and associated documentation files (the "Software"), to deal
6 * in the Software without restriction, including without limitation the rights
7 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
8 * copies of the Software, and to permit persons to whom the Software is
9 * furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice shall be included in
12 * all copies or substantial portions of the Software.
13 *
14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
17 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
18 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
19 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
20 * THE SOFTWARE.
21 */
22#pragma once
23
24#include <cassert>
25#include <string>
26#include <string_view>
27#include <vector>
28#include <functional>
29#include <memory>
30#include <unordered_set>
31
32#include "musx/dom/Fundamentals.h"
33#include "musx/dom/MusxInstance.h"
34
35namespace musx {
36
37namespace dom {
38class FontInfo;
39class Document;
40class TextsBase;
41
42namespace options {
44}
45
46} // namespace dom
47
48namespace util {
49
53{
61 {
62 None,
63 MusicFont,
64 TextFont,
66 };
67
69 EnigmaStyles(const std::weak_ptr<dom::Document>& document)
70 : font(std::make_shared<dom::FontInfo>(document))
71 {
72 }
73
76 {
77 EnigmaStyles result = *this;
78 result.font = std::make_shared<dom::FontInfo>(*this->font);
79 return result;
80 }
81
82 std::shared_ptr<dom::FontInfo> font;
86 int tracking{};
87};
88
89class EnigmaParsingContext;
90
157{
158public:
160 template <typename CharT>
161 static std::string fromU8(const CharT* s)
162 {
163 static_assert(std::is_same<CharT, char>::value || std::is_same<CharT, decltype(u8'a')>::value,
164 "fromU8() only accepts char or char8_t pointers");
165 return std::string(reinterpret_cast<const char*>(s));
166 }
167
169 static std::string toU8(char32_t cp);
170
177 {
184
192 };
193
200 {
212 Ascii,
213
225 Unicode,
226
238 Smufl
239 };
240
293
295 static bool startsWithFontCommand(const std::string& text);
296
298 static bool startsWithStyleCommand(const std::string& text);
299
301 static std::optional<dom::options::AccidentalInsertSymbolType> commandIsAccidentalType(std::string_view commandText);
302
323 static std::vector<std::string> parseComponents(const std::string& input, size_t* parsedLength = nullptr);
324
329 using TextChunkCallback = std::function<bool(
330 const std::string& text,
331 const EnigmaStyles& styles
332 )>;
333
343 using TextInsertCallback = std::function<std::optional<std::string>(
344 const std::vector<std::string>& parsedCommand
345 )>;
346
348 static inline TextInsertCallback defaultInsertsCallback = [](const std::vector<std::string>&) { return std::nullopt; };
349
375 static bool parseEnigmaText(const std::shared_ptr<dom::Document>& document, dom::Cmper forPartId, const std::string& rawText,
376 const TextChunkCallback& onText, const TextInsertCallback& onInsert,
377 const EnigmaParsingOptions& options = {}, const EnigmaParsingContext* parsingContext = nullptr)
378 {
379 return parseEnigmaTextImpl(document, forPartId, rawText, onText, onInsert, options, parsingContext, EnigmaStyles(document));
380 }
381
391 static bool parseEnigmaText(const std::shared_ptr<dom::Document>& document, dom::Cmper forPartId, const std::string& rawText, const TextChunkCallback& onText,
392 const EnigmaParsingOptions& options = {}, const EnigmaParsingContext* parsingContext = nullptr)
393 {
394 return parseEnigmaTextImpl(document, forPartId, rawText, onText, defaultInsertsCallback, options, parsingContext, EnigmaStyles(document));
395 }
396
405 static bool parseStyleCommand(std::vector<std::string> components, EnigmaStyles& styles);
406
408 static std::string trimTags(const std::string& input);
409
410private:
411 static bool parseEnigmaTextImpl(const std::shared_ptr<dom::Document>& document, dom::Cmper forPartId, const std::string& rawText,
412 const TextChunkCallback& onText, const TextInsertCallback& onInsert,
413 const EnigmaParsingOptions& options, const EnigmaParsingContext* parsingContext,
414 const EnigmaStyles& startingStyles);
415};
416
424{
425private:
427 dom::Cmper m_forPartId;
428 std::optional<int> m_forPageNumber;
430
431public:
434 : m_rawText(nullptr), m_forPartId(dom::SCORE_PARTID), m_insertFunc(EnigmaString::defaultInsertsCallback)
435 {}
436
443 std::optional<dom::Cmper> forPageId = std::nullopt,
445 : m_rawText(std::move(rawText)), m_forPartId(forPartId), m_forPageNumber(forPageId), m_insertFunc(insertFunc)
446 {}
447
449 explicit operator bool() const noexcept
450 { return static_cast<bool>(m_rawText); }
451
452 std::string affixText;
454
460 std::string getText(bool trimTags = false,
462 const std::unordered_set<std::string_view>& ignoreTags = {}) const;
463
471 const EnigmaString::TextInsertCallback& onInsert,
472 const EnigmaString::EnigmaParsingOptions& options = {}) const;
473
479 const EnigmaString::EnigmaParsingOptions& options = {}) const
480 {
482 }
483
489
491 dom::MusxInstance<dom::TextsBase> getRawText() const { return m_rawText; }
492
493 // If there is ever a need for a non-const version of the pointer, we can always
494 // look it up again.
495
497 dom::Cmper getRequestedPartId() const { return m_forPartId; }
498
500 std::optional<int> getPageNumber() const { return m_forPageNumber; }
501};
502
503} // namespace util
504} // namespace musx
Wrapper class for interpreting and rendering Enigma-style strings with insert handling.
Definition EnigmaString.h:424
bool affixIsPrefix
True if affixText is a prefix; false if it is a suffix.
Definition EnigmaString.h:453
std::string getText(bool trimTags=false, EnigmaString::AccidentalStyle accidentalStyle=EnigmaString::AccidentalStyle::Ascii, const std::unordered_set< std::string_view > &ignoreTags={}) const
Return displayable text with Enigma tags converted.
Definition EnigmaString.cpp:605
dom::MusxInstance< dom::FontInfo > parseFirstFontInfo() const
Returns a shared pointer to a FontInfo instance that reflects the first font information in the text.
Definition EnigmaString.cpp:619
bool parseEnigmaText(const EnigmaString::TextChunkCallback &onText, const EnigmaString::EnigmaParsingOptions &options={}) const
Parse the Enigma text into structured chunks with insert handling.
Definition EnigmaString.h:478
dom::Cmper getRequestedPartId() const
Get the requested part id.
Definition EnigmaString.h:497
std::optional< int > getPageNumber() const
Get the page number that was supplied, if any.
Definition EnigmaString.h:500
dom::MusxInstance< dom::TextsBase > getRawText() const
Get the raw text pointer.
Definition EnigmaString.h:491
EnigmaParsingContext(dom::MusxInstance< dom::TextsBase > rawText, dom::Cmper forPartId, std::optional< dom::Cmper > forPageId=std::nullopt, EnigmaString::TextInsertCallback insertFunc=EnigmaString::defaultInsertsCallback)
Constructor.
Definition EnigmaString.h:442
bool parseEnigmaText(const EnigmaString::TextChunkCallback &onText, const EnigmaString::TextInsertCallback &onInsert, const EnigmaString::EnigmaParsingOptions &options={}) const
Parse the Enigma text into structured chunks with insert handling.
Definition EnigmaString.cpp:582
EnigmaParsingContext()
Null constructor.
Definition EnigmaString.h:433
std::string affixText
Prefix or suffix to be passed in parsing options.
Definition EnigmaString.h:452
Static class that provides utilities to extract information from enigma strings. Enigma strings use t...
Definition EnigmaString.h:157
static std::string trimTags(const std::string &input)
Trims all enigma tags from an enigma string, leaving just the plain text.
Definition EnigmaString.cpp:547
static std::string fromU8(const CharT *s)
Convert u8"" literals to std::string in a way that works both in C++17 and C++20+.
Definition EnigmaString.h:161
static std::optional< dom::options::AccidentalInsertSymbolType > commandIsAccidentalType(std::string_view commandText)
Returns the accidental insert symbol type if the input command is an accidental insert.
Definition EnigmaString.cpp:263
static bool startsWithStyleCommand(const std::string &text)
Returns true if the enigma string starts with a style insert.
Definition EnigmaString.cpp:131
static bool parseStyleCommand(std::vector< std::string > components, EnigmaStyles &styles)
Incorporates an enigma font insert into the supplied dom::FontInfo instance.
Definition EnigmaString.cpp:209
static bool startsWithFontCommand(const std::string &text)
Returns true if the enigma string starts with a font insert.
Definition EnigmaString.cpp:119
AccidentalStyle
Enumeration to specify the type of accidental substitution representation.
Definition EnigmaString.h:200
@ Smufl
Use SMuFL notation-specific accidentals.
@ Ascii
Use ASCII substitutions for accidentals.
@ Unicode
Use Unicode text accidentals.
static std::string toU8(char32_t cp)
Concerts a 32-bit codepoint to a utf8-encoded std::string.
Definition EnigmaString.cpp:94
static bool parseEnigmaText(const std::shared_ptr< dom::Document > &document, dom::Cmper forPartId, const std::string &rawText, const TextChunkCallback &onText, const TextInsertCallback &onInsert, const EnigmaParsingOptions &options={}, const EnigmaParsingContext *parsingContext=nullptr)
Parses an Enigma-formatted string, handling font inserts and escaped carets.
Definition EnigmaString.h:375
static TextInsertCallback defaultInsertsCallback
Inserts callback to take all default insert subsitutions determined by parseEnigmaText.
Definition EnigmaString.h:348
AccidentalInsertHandling
Enumeration to specify the default handling for accidental insert commands. Like all Enigma commands,...
Definition EnigmaString.h:177
@ ParseToGlyphs
Parse accidental insert commands into glyph font changes and character strings.
@ Substitute
Substitute accidental insert commands with textual representations.
std::function< bool(const std::string &text, const EnigmaStyles &styles)> TextChunkCallback
Iteration function type that the parser calls back when the font has changed or when recursively pars...
Definition EnigmaString.h:332
static bool parseEnigmaText(const std::shared_ptr< dom::Document > &document, dom::Cmper forPartId, const std::string &rawText, const TextChunkCallback &onText, const EnigmaParsingOptions &options={}, const EnigmaParsingContext *parsingContext=nullptr)
Simplified version of parseEnigmaText that strips unhandled inserts. Useful in particular when the ca...
Definition EnigmaString.h:391
static std::vector< std::string > parseComponents(const std::string &input, size_t *parsedLength=nullptr)
Parses an enigma text insert into its constituent components.
Definition EnigmaString.cpp:145
std::function< std::optional< std::string >(const std::vector< std::string > &parsedCommand)> TextInsertCallback
Iteration function type that the parser calls back when it encounters an Enigma text insert that requ...
Definition EnigmaString.h:345
AccidentalInsertSymbolType
Insert symbol types for accidentals.
Definition Options.h:1469
std::shared_ptr< const T > MusxInstance
Defines the type of a musx instance stored in a pool.
Definition MusxInstance.h:39
int32_t Evpu
EVPU value (288 per inch)
Definition Fundamentals.h:57
uint16_t Cmper
Enigma "comperator" key type.
Definition Fundamentals.h:55
object model for musx file (enigmaxml)
Definition BaseClasses.h:36
Options for configuring how Enigma strings are parsed.
Definition EnigmaString.h:248
bool ignoreStyleTags
If value is true, font & style tags are ignored. Note that you may still get get font and style chang...
Definition EnigmaString.h:284
EnigmaParsingOptions()
constructor
Definition EnigmaString.h:250
EnigmaParsingOptions(AccidentalStyle accidentalStyle)
constructor for accidental substitution
Definition EnigmaString.h:255
AccidentalStyle substitutionStyle
Specifies the accidental substitution style used when insertHandling is Substitute.
Definition EnigmaString.h:273
std::unordered_set< std::string_view > ignoreTags
Skip tags in this set. Primarily used by the "partname" insert to avoid a situation where the partnam...
Definition EnigmaString.h:291
AccidentalInsertHandling insertHandling
Specifies how accidental insert commands are handled during parsing.
Definition EnigmaString.h:265
bool stripUnknownTags
Specifies whether to strip unknown tags or dump them into the output string.
Definition EnigmaString.h:278
Text styles for enigma strings.
Definition EnigmaString.h:53
EnigmaStyles(const std::weak_ptr< dom::Document > &document)
constructor
Definition EnigmaString.h:69
std::shared_ptr< dom::FontInfo > font
the font to use
Definition EnigmaString.h:82
CategoryTracking
Specifies is the current enigma style tracks an expressions marking category font....
Definition EnigmaString.h:61
@ NumberFont
tracks the category's number font (not implemented in Finale U.I.)
@ TextFont
tracks the category's text font
@ MusicFont
tracks the category's music font
int tracking
inter-character tracking in EMs (1/1000 font size)
Definition EnigmaString.h:86
EnigmaStyles createDeepCopy() const
Creates a deep copy of the styles, including copying any shared pointer instances.
Definition EnigmaString.h:75
dom::Evpu superscript
superscript setting added to baseline (positive means up)
Definition EnigmaString.h:85
dom::Evpu baseline
baseline setting (positive means up)
Definition EnigmaString.h:84
CategoryTracking categoryFont
how this font is tracked against a marking category
Definition EnigmaString.h:83