blob: 9d5ba8afcf6a7259b3d8da06a98d6fe7119b9788 (
plain) (
blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
|
// Copyright Vespa.ai. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root.
#pragma once
#include <vespa/vespalib/stllike/string.h>
namespace juniper::separators {

/*
 * Separator characters recognised in strings passed to juniper.
 */

// Separators as UTF-8 encoded strings. These are only declared here
// (extern); their definitions are provided outside this header.
extern vespalib::string interlinear_annotation_anchor_string;
extern vespalib::string interlinear_annotation_separator_string;
extern vespalib::string interlinear_annotation_terminator_string;
extern vespalib::string group_separator_string;
extern vespalib::string record_separator_string;
extern vespalib::string unit_separator_string;

// Separators as single UTF-32 code units (U+FFF9, U+FFFA, U+FFFB).
constexpr char32_t interlinear_annotation_anchor{U'\xFFF9'};
constexpr char32_t interlinear_annotation_separator{U'\xFFFA'};
constexpr char32_t interlinear_annotation_terminator{U'\xFFFB'};

// GS (0x1D): the character used to separate paragraphs.
constexpr char8_t group_separator{u8'\x1D'};

// RS (0x1E).
constexpr char8_t record_separator{u8'\x1E'};

// US (0x1F): the character used to separate words in CJK texts.
constexpr char8_t unit_separator{u8'\x1F'};

} // namespace juniper::separators
|