You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
Copy file name to clipboard. Expand all lines: src/sdk/models/shared/partitionparameters.ts
+36
Original file line number
Diff line number
Diff line change
@@ -175,6 +175,22 @@ export type PartitionParameters = {
175
175
* Deprecated! Use skip_infer_table_types to opt out of table extraction for any file type. If False and strategy=hi_res, no Table Elements will be extracted from pdf files regardless of skip_infer_table_types contents.
176
176
*/
177
177
pdfInferTableStructure?: boolean|undefined;
178
+
/**
179
+
* If two characters are closer together than this margin they are considered part of the same line. The margin is specified relative to the width of the character.
180
+
*/
181
+
pdfminerCharMargin?: number|null|undefined;
182
+
/**
183
+
* If two lines are close together they are considered to be part of the same paragraph. The margin is specified relative to the height of a line.
184
+
*/
185
+
pdfminerLineMargin?: number|null|undefined;
186
+
/**
187
+
* If two characters have more overlap than this they are considered to be on the same line. The overlap is specified relative to the minimum height of both characters.
188
+
*/
189
+
pdfminerLineOverlap?: number|null|undefined;
190
+
/**
191
+
* If two characters on the same line are further apart than this margin then they are considered to be two separate words, and an intermediate space will be added for readability. The margin is specified relative to the width of the character.
192
+
*/
193
+
pdfminerWordMargin?: number|null|undefined;
178
194
/**
179
195
* A value between 0.0 and 1.0 describing the minimum similarity two elements must have to be included in the same chunk. Note that similar elements may be separated to meet chunk-size criteria; this value can only guarantee that two elements with similarity below the threshold will appear in separate chunks.
0 commit comments