Book a Demo!
CoCalc Logo Icon
StoreFeaturesDocsShareSupportNewsAboutPoliciesSign UpSign In
stenzek
GitHub Repository: stenzek/duckstation
Path: blob/master/dep/lzma/include/Ppmd.h
4253 views
1
/* Ppmd.h -- PPMD codec common code
2
2023-03-05 : Igor Pavlov : Public domain
3
This code is based on PPMd var.H (2001): Dmitry Shkarin : Public domain */
4
5
#ifndef ZIP7_INC_PPMD_H
6
#define ZIP7_INC_PPMD_H
7
8
#include "CpuArch.h"
9
10
EXTERN_C_BEGIN
11
12
#if defined(MY_CPU_SIZEOF_POINTER) && (MY_CPU_SIZEOF_POINTER == 4)
/*
   PPMD code always uses 32-bit internal fields in PPMD structures to store
   internal references in the main block.
     if (PPMD_32BIT is defined), the PPMD code stores internal pointers
       in the 32-bit reference fields.
     if (PPMD_32BIT is NOT defined), the PPMD code stores internal UInt32
       offsets in the reference fields.
     if (pointer size is 64-bit), then (PPMD_32BIT) mode is not allowed,
     if (pointer size is 32-bit), then (PPMD_32BIT) mode is optional,
       and it's allowed to disable PPMD_32BIT mode even if the pointer is 32-bit.
   PPMD code works slightly faster in (PPMD_32BIT) mode.
*/
  #define PPMD_32BIT
#endif
24
25
/* Bit widths used to build the fixed-point scale below. */
#define PPMD_INT_BITS 7
#define PPMD_PERIOD_BITS 7
/* 1 << (7 + 7) = 16384. */
#define PPMD_BIN_SCALE (1 << (PPMD_INT_BITS + PPMD_PERIOD_BITS))

/* Adds the bias (1 << (shift - round)) to summ, then shifts right by shift. */
#define PPMD_GET_MEAN_SPEC(summ, shift, round) (((summ) + (1 << ((shift) - (round)))) >> (shift))
/* PPMD_GET_MEAN_SPEC with shift = PPMD_PERIOD_BITS and round = 2, i.e. ((summ) + 32) >> 7. */
#define PPMD_GET_MEAN(summ) PPMD_GET_MEAN_SPEC((summ), PPMD_PERIOD_BITS, 2)
/* prob plus (1 << PPMD_INT_BITS), minus the mean of prob. */
#define PPMD_UPDATE_PROB_0(prob) ((prob) + (1 << PPMD_INT_BITS) - PPMD_GET_MEAN(prob))
/* prob minus the mean of prob. */
#define PPMD_UPDATE_PROB_1(prob) ((prob) - PPMD_GET_MEAN(prob))
33
34
/* Group sizes; PPMD_N4 is derived from the other three. */
#define PPMD_N1 4
#define PPMD_N2 4
#define PPMD_N3 4
/* (128 + 3 - 4 - 8 - 12) / 4 = 26 with the values above. */
#define PPMD_N4 ((128 + 3 - 1 * PPMD_N1 - 2 * PPMD_N2 - 3 * PPMD_N3) / 4)
/* Sum of the four group sizes: 4 + 4 + 4 + 26 = 38. */
#define PPMD_NUM_INDEXES (PPMD_N1 + PPMD_N2 + PPMD_N3 + PPMD_N4)
39
40
MY_CPU_pragma_pack_push_1
41
/* Most compilers work OK here even without #pragma pack(push, 1), but some GCC compilers need it. */
42
43
/* SEE-contexts for PPM-contexts with masked symbols */
44
typedef struct
45
{
46
UInt16 Summ; /* Freq */
47
Byte Shift; /* Speed of Freq change; low Shift is for fast change */
48
Byte Count; /* Count to next change of Shift */
49
} CPpmd_See;
50
51
/*
  Ppmd_See_UPDATE(p): p points to a record with Summ, Shift and Count fields.
  If Shift is below PPMD_PERIOD_BITS and the pre-decremented Count reaches zero:
    Summ is doubled (truncated to UInt16),
    Count is set to (3 << old Shift), truncated to Byte,
    and Shift is incremented.
  When Shift >= PPMD_PERIOD_BITS, Count is not decremented at all.
  The expansion is a brace block and evaluates (p) several times,
  so the argument must not have side effects.
*/
#define Ppmd_See_UPDATE(p) \
  { if ((p)->Shift < PPMD_PERIOD_BITS && --(p)->Count == 0) \
    { (p)->Summ = (UInt16)((p)->Summ << 1); \
      (p)->Count = (Byte)(3 << (p)->Shift++); }}
55
56
57
typedef struct
58
{
59
Byte Symbol;
60
Byte Freq;
61
UInt16 Successor_0;
62
UInt16 Successor_1;
63
} CPpmd_State;
64
65
typedef struct CPpmd_State2_
66
{
67
Byte Symbol;
68
Byte Freq;
69
} CPpmd_State2;
70
71
typedef struct CPpmd_State4_
72
{
73
UInt16 Successor_0;
74
UInt16 Successor_1;
75
} CPpmd_State4;
76
77
MY_CPU_pragma_pop
78
79
/*
80
PPMD code can write full CPpmd_State structure data to CPpmd*_Context
81
at (byte offset = 2) instead of some fields of original CPpmd*_Context structure.
82
83
If we use pointers to different types, but that point to shared
84
memory space, we can have an aliasing problem (strict aliasing).
85
86
XLC compiler in -O2 mode can change the order of memory write instructions
87
in relation to read instructions, if we use pointers to different types.
88
89
To solve that aliasing problem we use combined CPpmd*_Context structure
90
with unions that contain the fields from both structures:
91
the original CPpmd*_Context and CPpmd_State.
92
So we can access the fields from both structures via one pointer,
93
and the compiler doesn't change the order of write instructions
94
in relation to read instructions.
95
96
If we don't use memory write instructions to shared memory in
97
some local code, and we use only reading instructions (read only),
98
then probably it's safe to use pointers to different types for reading.
99
*/
100
101
102
103
/*
  Reference helpers. (p) is a pointer to an object that has a (Byte *Base) field.
    Ppmd_Ref_Type(type)             : type of a stored reference to (type)
    Ppmd_GetRef(p, ptr)             : pointer -> stored reference
    Ppmd_GetPtr(p, ref)             : stored reference -> pointer
    Ppmd_GetPtr_Type(p, ref, type)  : stored reference -> (type *) pointer
*/
#ifdef PPMD_32BIT

  /* References are the pointers themselves; (p) is not used. */
  #define Ppmd_Ref_Type(type)     type *
  #define Ppmd_GetRef(p, ptr)     (ptr)
  #define Ppmd_GetPtr(p, ptr)     (ptr)
  #define Ppmd_GetPtr_Type(p, ptr, note_type) (ptr)

#else

  /* References are UInt32 byte offsets relative to (p)->Base. */
  #define Ppmd_Ref_Type(type)     UInt32
  #define Ppmd_GetRef(p, ptr)     ((UInt32)((Byte *)(ptr) - (p)->Base))
  #define Ppmd_GetPtr(p, offs)    ((void *)((p)->Base + (offs)))
  #define Ppmd_GetPtr_Type(p, offs, type) ((type *)Ppmd_GetPtr(p, offs))

#endif // PPMD_32BIT
118
119
120
typedef Ppmd_Ref_Type(CPpmd_State) CPpmd_State_Ref;
121
typedef Ppmd_Ref_Type(void) CPpmd_Void_Ref;
122
typedef Ppmd_Ref_Type(Byte) CPpmd_Byte_Ref;
123
124
125
/*
126
#ifdef MY_CPU_LE_UNALIGN
127
// the unaligned 32-bit access latency can be too large, if the data is not in L1 cache.
128
#define Ppmd_GET_SUCCESSOR(p) ((CPpmd_Void_Ref)*(const UInt32 *)(const void *)&(p)->Successor_0)
129
#define Ppmd_SET_SUCCESSOR(p, v) *(UInt32 *)(void *)(void *)&(p)->Successor_0 = (UInt32)(v)
130
131
#else
132
*/
133
134
/*
135
We can write 16-bit halves to 32-bit (Successor) field in any selected order.
136
But the native order is the more consistent way.
137
So we use the native order, if LE/BE order can be detected here at compile time.
138
*/
139
140
/*
  Ppmd_GET_SUCCESSOR(p)    : combines (p)->Successor_0 and (p)->Successor_1
                             into one 32-bit value, cast to CPpmd_Void_Ref.
  Ppmd_SET_SUCCESSOR(p, v) : splits (UInt32)(v) into the two 16-bit fields.
  With MY_CPU_BE defined, Successor_0 holds the high 16 bits;
  otherwise Successor_0 holds the low 16 bits.
  Both macros evaluate (p) twice; Ppmd_SET_SUCCESSOR also evaluates (v) twice
  and expands to a brace block.
*/
#ifdef MY_CPU_BE

#define Ppmd_GET_SUCCESSOR(p) \
    ( (CPpmd_Void_Ref) (((UInt32)(p)->Successor_0 << 16) | (p)->Successor_1) )

#define Ppmd_SET_SUCCESSOR(p, v) { \
    (p)->Successor_0 = (UInt16)(((UInt32)(v) >> 16) /* & 0xFFFF */); \
    (p)->Successor_1 = (UInt16)((UInt32)(v) /* & 0xFFFF */); }

#else

#define Ppmd_GET_SUCCESSOR(p) \
    ( (CPpmd_Void_Ref) ((p)->Successor_0 | ((UInt32)(p)->Successor_1 << 16)) )

#define Ppmd_SET_SUCCESSOR(p, v) { \
    (p)->Successor_0 = (UInt16)((UInt32)(v) /* & 0xFFFF */); \
    (p)->Successor_1 = (UInt16)(((UInt32)(v) >> 16) /* & 0xFFFF */); }

#endif
159
160
// #endif
161
162
163
/*
  PPMD_SetAllBitsIn256Bytes(p): stores ~(size_t)0, converted to the element
  type of (p), into the first (256 / sizeof((p)[0])) elements of (p),
  eight elements per loop iteration.
  The expansion is a brace block that declares a local (size_t z), so the
  argument must not refer to a variable named z. (p) is evaluated many times
  and is parenthesized so that pointer expressions such as (buf + 1) expand
  correctly.
*/
#define PPMD_SetAllBitsIn256Bytes(p) \
  { size_t z; for (z = 0; z < 256 / sizeof((p)[0]); z += 8) { \
    (p)[z+7] = (p)[z+6] = (p)[z+5] = (p)[z+4] = \
    (p)[z+3] = (p)[z+2] = (p)[z+1] = (p)[z+0] = ~(size_t)0; }}
166
167
EXTERN_C_END
168
169
#endif
170
171