| OLD | NEW |
| 1 // Copyright 2014 PDFium Authors. All rights reserved. | 1 // Copyright 2014 PDFium Authors. All rights reserved. |
| 2 // Use of this source code is governed by a BSD-style license that can be | 2 // Use of this source code is governed by a BSD-style license that can be |
| 3 // found in the LICENSE file. | 3 // found in the LICENSE file. |
| 4 | 4 |
| 5 // Original code copyright 2014 Foxit Software Inc. http://www.foxitsoftware.com | 5 // Original code copyright 2014 Foxit Software Inc. http://www.foxitsoftware.com |
| 6 | 6 |
| 7 #include "../../include/fpdfapi/fpdf_page.h" | 7 #include "../../include/fpdfapi/fpdf_page.h" |
| 8 #include "../../include/fpdfapi/fpdf_pageobj.h" | 8 #include "../../include/fpdfapi/fpdf_pageobj.h" |
| 9 #include "../../include/fpdftext/fpdf_text.h" | 9 #include "../../include/fpdftext/fpdf_text.h" |
| 10 #include "txtproc.h" | 10 #include "txtproc.h" |
| (...skipping 205 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 216 CTextBaseLine* pPrevLine = (CTextBaseLine*)m_BaseLines.GetAt(i - 1); | 216 CTextBaseLine* pPrevLine = (CTextBaseLine*)m_BaseLines.GetAt(i - 1); |
| 217 if (pBaseLine->CanMerge(pPrevLine)) { | 217 if (pBaseLine->CanMerge(pPrevLine)) { |
| 218 pPrevLine->Merge(pBaseLine); | 218 pPrevLine->Merge(pBaseLine); |
| 219 delete pBaseLine; | 219 delete pBaseLine; |
| 220 m_BaseLines.RemoveAt(i); | 220 m_BaseLines.RemoveAt(i); |
| 221 i --; | 221 i --; |
| 222 } | 222 } |
| 223 } | 223 } |
| 224 if (m_bAutoWidth) { | 224 if (m_bAutoWidth) { |
| 225 int* widths = FX_Alloc(int, m_BaseLines.GetSize()); | 225 int* widths = FX_Alloc(int, m_BaseLines.GetSize()); |
| 226 if (widths) { | 226 for (i = 0; i < m_BaseLines.GetSize(); i ++) { |
| 227 for (i = 0; i < m_BaseLines.GetSize(); i ++) { | 227 widths[i] = 0; |
| 228 widths[i] = 0; | 228 CTextBaseLine* pBaseLine = (CTextBaseLine*)m_BaseLines.GetAt(i); |
| 229 CTextBaseLine* pBaseLine = (CTextBaseLine*)m_BaseLines.GetAt(i); | 229 int TotalChars = 0; |
| 230 int TotalChars = 0; | 230 FX_FLOAT TotalWidth = 0; |
| 231 FX_FLOAT TotalWidth = 0; | 231 int minchars; |
| 232 int minchars; | 232 pBaseLine->CountChars(TotalChars, TotalWidth, minchars); |
| 233 pBaseLine->CountChars(TotalChars, TotalWidth, minchars); | 233 if (TotalChars) { |
| 234 if (TotalChars) { | 234 FX_FLOAT charwidth = TotalWidth / TotalChars; |
| 235 FX_FLOAT charwidth = TotalWidth / TotalChars; | 235 widths[i] = (int)((MaxRightX - MinLeftX) / charwidth); |
| 236 widths[i] = (int)((MaxRightX - MinLeftX) / charwidth); | |
| 237 } | |
| 238 if (widths[i] > 1000) { | |
| 239 widths[i] = 1000; | |
| 240 } | |
| 241 if (widths[i] < minchars) { | |
| 242 widths[i] = minchars; | |
| 243 } | |
| 244 } | 236 } |
| 245 int AvgWidth = 0, widthcount = 0; | 237 if (widths[i] > 1000) { |
| 246 for (i = 0; i < m_BaseLines.GetSize(); i ++) | 238 widths[i] = 1000; |
| 247 if (widths[i]) { | |
| 248 AvgWidth += widths[i]; | |
| 249 widthcount ++; | |
| 250 } | |
| 251 AvgWidth = int((FX_FLOAT)AvgWidth / widthcount + 0.5); | |
| 252 int MaxWidth = 0; | |
| 253 for (i = 0; i < m_BaseLines.GetSize(); i ++) | |
| 254 if (MaxWidth < widths[i]) { | |
| 255 MaxWidth = widths[i]; | |
| 256 } | |
| 257 if (MaxWidth > AvgWidth * 6 / 5) { | |
| 258 MaxWidth = AvgWidth * 6 / 5; | |
| 259 } | 239 } |
| 260 FX_Free(widths); | 240 if (widths[i] < minchars) { |
| 261 if (iMinWidth < MaxWidth) { | 241 widths[i] = minchars; |
| 262 iMinWidth = MaxWidth; | |
| 263 } | 242 } |
| 264 } | 243 } |
| 244 int AvgWidth = 0, widthcount = 0; |
| 245 for (i = 0; i < m_BaseLines.GetSize(); i ++) |
| 246 if (widths[i]) { |
| 247 AvgWidth += widths[i]; |
| 248 widthcount ++; |
| 249 } |
| 250 AvgWidth = int((FX_FLOAT)AvgWidth / widthcount + 0.5); |
| 251 int MaxWidth = 0; |
| 252 for (i = 0; i < m_BaseLines.GetSize(); i ++) |
| 253 if (MaxWidth < widths[i]) { |
| 254 MaxWidth = widths[i]; |
| 255 } |
| 256 if (MaxWidth > AvgWidth * 6 / 5) { |
| 257 MaxWidth = AvgWidth * 6 / 5; |
| 258 } |
| 259 FX_Free(widths); |
| 260 if (iMinWidth < MaxWidth) { |
| 261 iMinWidth = MaxWidth; |
| 262 } |
| 265 } | 263 } |
| 266 for (i = 0; i < m_BaseLines.GetSize(); i ++) { | 264 for (i = 0; i < m_BaseLines.GetSize(); i ++) { |
| 267 CTextBaseLine* pBaseLine = (CTextBaseLine*)m_BaseLines.GetAt(i); | 265 CTextBaseLine* pBaseLine = (CTextBaseLine*)m_BaseLines.GetAt(i); |
| 268 pBaseLine->MergeBoxes(); | 266 pBaseLine->MergeBoxes(); |
| 269 } | 267 } |
| 270 if (m_bKeepColumn) { | 268 if (m_bKeepColumn) { |
| 271 FindColumns(); | 269 FindColumns(); |
| 272 } | 270 } |
| 273 for (i = 0; i < m_BaseLines.GetSize(); i ++) { | 271 for (i = 0; i < m_BaseLines.GetSize(); i ++) { |
| 274 CTextBaseLine* pBaseLine = (CTextBaseLine*)m_BaseLines.GetAt(i); | 272 CTextBaseLine* pBaseLine = (CTextBaseLine*)m_BaseLines.GetAt(i); |
| (...skipping 496 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 771 { | 769 { |
| 772 buffer.EstimateSize(0, 10240); | 770 buffer.EstimateSize(0, 10240); |
| 773 CPDF_Page page; | 771 CPDF_Page page; |
| 774 page.Load(pDoc, pPage); | 772 page.Load(pDoc, pPage); |
| 775 CPDF_ParseOptions options; | 773 CPDF_ParseOptions options; |
| 776 options.m_bTextOnly = TRUE; | 774 options.m_bTextOnly = TRUE; |
| 777 options.m_bSeparateForm = FALSE; | 775 options.m_bSeparateForm = FALSE; |
| 778 page.ParseContent(&options); | 776 page.ParseContent(&options); |
| 779 _PDF_GetTextStream_Unicode(buffer, &page, TRUE, NULL); | 777 _PDF_GetTextStream_Unicode(buffer, &page, TRUE, NULL); |
| 780 } | 778 } |
| OLD | NEW |