Question

У нас есть Windows-служба на C#, которая в настоящее время обрабатывает все PDF-файлы: считывает 2D-штрих-код в PDF с помощью стороннего компонента, затем обновляет базу данных и сохраняет документ в хранилище документов.

Есть ли способ разделить файл после считывания штрих-кода и сохранить каждую часть как отдельный документ?

Например, если есть 10-страничный документ, он должен разбиваться на 10 разных файлов.

Спасибо.

user1788053 · Answer 1 · 08 ноября 2012

Я столкнулся с той же задачей. Для разделения документа можно использовать библиотеку iTextSharp:

/// <summary>
/// Splits a PDF into two files at a given page: pages 1..pagenumber-1 go to the
/// first destination and pages pagenumber..last go to the second.
/// </summary>
/// <param name="args">
/// Exactly four values: source file, first destination file, second destination
/// file, and the 1-based page number at which the second file starts.
/// </param>
/// <remarks>
/// Usage errors and all exceptions are reported on <see cref="Console.Error"/>;
/// nothing is rethrown to the caller.
/// </remarks>
public Split(String[] args)
    {
        if (args.Length != 4) 
        {
            Console.Error.WriteLine("This tools needs 4 parameters:\njava Split srcfile destfile1 destfile2 pagenumber");
            return;
        }

        try 
        {
            int pagenumber = int.Parse(args[3]);

            // we create a reader for a certain document
            PdfReader reader = new PdfReader(args[0]);
            try
            {
                // we retrieve the total number of pages
                int n = reader.NumberOfPages;
                Console.WriteLine("There are " + n + " pages in the original file.");

                // The split page must leave at least one page in each output file.
                if (pagenumber < 2 || pagenumber > n) 
                {
                    throw new DocumentException("You can't split this document at page " + pagenumber + "; there is no such page.");
                }

                // The using blocks guarantee both output streams are released even
                // when importing a page throws half-way through.
                using (FileStream stream1 = new FileStream(args[1], FileMode.Create))
                using (FileStream stream2 = new FileStream(args[2], FileMode.Create))
                {
                    // step 1: creation of a document-object
                    Document document1 = new Document(reader.GetPageSizeWithRotation(1));
                    Document document2 = new Document(reader.GetPageSizeWithRotation(pagenumber));
                    // step 2: we create a writer that listens to the document
                    PdfWriter writer1 = PdfWriter.GetInstance(document1, stream1);
                    PdfWriter writer2 = PdfWriter.GetInstance(document2, stream2);
                    // step 3: we open the document
                    document1.Open();
                    PdfContentByte cb1 = writer1.DirectContent;
                    document2.Open();
                    PdfContentByte cb2 = writer2.DirectContent;

                    // step 4: we add content
                    for (int i = 1; i < pagenumber; i++)
                    {
                        AppendPage(reader, document1, writer1, cb1, i);
                    }
                    for (int i = pagenumber; i <= n; i++)
                    {
                        AppendPage(reader, document2, writer2, cb2, i);
                        Console.WriteLine("Processed page " + i);
                    }

                    // step 5: we close the document
                    document1.Close();
                    document2.Close();
                }
            }
            finally
            {
                // Release the source file handle on success and on failure alike.
                reader.Close();
            }
        }
        catch(Exception e) 
        {
            Console.Error.WriteLine(e.Message);
            Console.Error.WriteLine(e.StackTrace);
        }
    }

    /// <summary>
    /// Appends one page of <paramref name="reader"/> to <paramref name="document"/> as a new page,
    /// applying a rotating transform when the source page is rotated by 90 or 270 degrees.
    /// </summary>
    private static void AppendPage(PdfReader reader, Document document, PdfWriter writer, PdfContentByte canvas, int pageNumber)
    {
        document.SetPageSize(reader.GetPageSizeWithRotation(pageNumber));
        document.NewPage();
        PdfImportedPage page = writer.GetImportedPage(reader, pageNumber);
        int rotation = reader.GetPageRotation(pageNumber);
        if (rotation == 90 || rotation == 270) 
        {
            // Rotate the template and shift it up by the rotated page height so it lands on the page.
            canvas.AddTemplate(page, 0, -1f, 1f, 0, 0, reader.GetPageSizeWithRotation(pageNumber).Height);
        }
        else 
        {
            canvas.AddTemplate(page, 1f, 0, 0, 1f, 0, 0);
        }
    }

Marko · Answer 2 · 26 августа 2010

Вы можете использовать библиотеку PDF, например PDFSharp , читать файл, перебирать каждую страницу, добавлять их в новый документ PDF и сохранять их в файловой системе. Затем вы также можете удалить или сохранить оригинал.

Это довольно много кода, но очень простой, и эти примеры должны помочь вам начать.

http://www.pdfsharp.net/wiki/Default.aspx?Page=ConcatenateDocuments-sample&NS=&AspxAutoDetectCookieSupport=1

gyurisc · Answer 3 · 26 августа 2010

Предыдущий вопрос частично отвечает на ваши вопросы - как разделить документы PDF, если вы знаете, где находятся штрих-коды, вы можете легко разделить документы:

Как разделить файл PDF на страницы (желательно C #)

Рекомендуется использовать библиотеку под названием PDFSharp и образец , демонстрирующий разбиение PDF .

Gokuldas.Palapatta · Answer 4 · 24 сентября 2013

/// <summary>
/// Writes every page of a PDF as its own single-page file named
/// "&lt;page number&gt;.pdf" inside <paramref name="DestinationFolder"/>.
/// </summary>
/// <param name="sourcePdfPath">Path of the PDF to split.</param>
/// <param name="DestinationFolder">Folder that receives the per-page files; created if missing.</param>
/// <returns>
/// The number of pages written before the method finished or failed;
/// -1 when the failure happened before the first page was attempted.
/// </returns>
/// <remarks>
/// The method is best-effort: failures are reported through
/// <see cref="System.Diagnostics.Trace"/> instead of being thrown.
/// </remarks>
public int ExtractPages(string sourcePdfPath, string DestinationFolder)
        {
            int p = 0;
            iTextSharp.text.pdf.PdfReader reader = null;
            try
            {
                // The empty byte array is passed as the owner password.
                reader = new iTextSharp.text.pdf.PdfReader(new iTextSharp.text.pdf.RandomAccessFileOrArray(sourcePdfPath), new ASCIIEncoding().GetBytes(""));

                // NOTE(review): this resets a folder derived from the SOURCE path, not
                // DestinationFolder. Kept unchanged for callers that rely on it — confirm
                // whether it is still wanted, since it deletes recursively.
                string sourceDerivedFolder = sourcePdfPath.ToLower().Replace(".pdf", "");
                if (Directory.Exists(sourceDerivedFolder))
                {
                    Directory.Delete(sourceDerivedFolder, true);
                }
                Directory.CreateDirectory(sourceDerivedFolder);

                // The files are written here, so make sure the folder exists (no-op when it does).
                Directory.CreateDirectory(DestinationFolder);

                for (p = 1; p <= reader.NumberOfPages; p++)
                {
                    using (MemoryStream memoryStream = new MemoryStream())
                    {
                        // Size the output page with rotation applied so it matches the
                        // rotated placement used below.
                        iTextSharp.text.Document document = new iTextSharp.text.Document(reader.GetPageSizeWithRotation(p));
                        iTextSharp.text.pdf.PdfWriter writer = iTextSharp.text.pdf.PdfWriter.GetInstance(document, memoryStream);
                        writer.SetPdfVersion(iTextSharp.text.pdf.PdfWriter.PDF_VERSION_1_2);
                        writer.CompressionLevel = iTextSharp.text.pdf.PdfStream.BEST_COMPRESSION;
                        writer.SetFullCompression();
                        document.Open();

                        iTextSharp.text.pdf.PdfContentByte cb = writer.DirectContent;
                        iTextSharp.text.pdf.PdfImportedPage pageImport = writer.GetImportedPage(reader, p);
                        int rot = reader.GetPageRotation(p);
                        if (rot == 90 || rot == 270)
                        {
                            cb.AddTemplate(pageImport, 0, -1.0F, 1.0F, 0, 0, reader.GetPageSizeWithRotation(p).Height);
                        }
                        else
                        {
                            cb.AddTemplate(pageImport, 1.0F, 0, 0, 1.0F, 0, 0);
                        }

                        // Closing the document finalizes the PDF bytes in the memory stream.
                        document.Close();
                        File.WriteAllBytes(Path.Combine(DestinationFolder, p + ".pdf"), memoryStream.ToArray());
                    }
                }
            }
            catch (Exception ex)
            {
                // Stay best-effort for callers, but leave a trace instead of hiding the failure.
                System.Diagnostics.Trace.TraceError("ExtractPages failed for '" + sourcePdfPath + "' at page " + p + ": " + ex);
            }
            finally
            {
                if (reader != null)
                {
                    reader.Close();
                }
            }
            return p - 1;

        }

Вызовите эту функцию в нужном месте и передайте ей путь к исходному PDF-файлу и путь к папке назначения.

Ruben Suardi · Answer 5 · 16 января 2018

    /// <summary>
    /// Splits a PDF into one file per bookmark returned by
    /// <c>SimpleBookmark.GetBookmark</c>. Each output starts at its bookmark's page
    /// and ends just before the next bookmark's page (or at the last page), and is
    /// named after the bookmark title.
    /// </summary>
    /// <param name="fileName">Path of the PDF to split; outputs are written next to it.</param>
    /// <remarks>
    /// A document without bookmarks produces no output. Only the entries of the
    /// returned list are iterated, and each entry is expected to carry a "Page" value.
    /// </remarks>
    public  void SplitPDFByBookMark(string fileName)
    {
        var pdfReader = new PdfReader(fileName);
        try
        {
            IList<Dictionary<string, object>> bookmarks = SimpleBookmark.GetBookmark(pdfReader);
            if (bookmarks == null)
            {
                // The document has no outline, so there is nothing to split by.
                return;
            }

            for (int i = 0; i < bookmarks.Count; ++i)
            {
                IDictionary<string, object> current = bookmarks[i];
                IDictionary<string, object> next = i == bookmarks.Count - 1 ? null : bookmarks[i + 1];

                // The "Page" value starts with the page number followed by a space.
                int startPage = int.Parse(current["Page"].ToString().Split(' ')[0]);
                int nextStartPage = next == null
                    ? pdfReader.NumberOfPages + 1
                    : int.Parse(next["Page"].ToString().Split(' ')[0]);

                // Look the title up by key instead of relying on dictionary ordering,
                // and replace characters that cannot appear in a file name.
                string title = current["Title"].ToString();
                foreach (char invalid in Path.GetInvalidFileNameChars())
                {
                    title = title.Replace(invalid, '_');
                }

                SplitByBookmark(pdfReader, startPage, nextStartPage, title + ".pdf", fileName);
            }
        }
        finally
        {
            // Release the source file handle; exceptions propagate with their stack trace intact.
            pdfReader.Close();
        }
    }

    /// <summary>
    /// Copies the pages <paramref name="pageFrom"/> (inclusive) to <paramref name="PageTo"/>
    /// (exclusive) of <paramref name="reader"/> into a new PDF placed in the directory of
    /// <paramref name="inPutFileName"/>.
    /// </summary>
    /// <param name="reader">Open reader over the source document; not closed here.</param>
    /// <param name="pageFrom">1-based first page to copy.</param>
    /// <param name="PageTo">1-based page at which copying stops (exclusive).</param>
    /// <param name="outPutName">File name of the PDF to create.</param>
    /// <param name="inPutFileName">Path of the source PDF; only its directory part is used.</param>
    /// <remarks>
    /// When the range is empty (<paramref name="PageTo"/> is not greater than
    /// <paramref name="pageFrom"/>) the single page <paramref name="pageFrom"/> is written.
    /// </remarks>
    private void SplitByBookmark(PdfReader reader, int pageFrom, int PageTo, string outPutName, string inPutFileName)
    {
        string directory = Path.GetDirectoryName(inPutFileName) ?? string.Empty;
        string outputPath = Path.Combine(directory, outPutName);

        // Always copy at least one page: two bookmarks can point at the same page.
        int endExclusive = PageTo > pageFrom ? PageTo : pageFrom + 1;

        // NOTE(review): pages are imported onto the Document's default page size and
        // without rotation handling — confirm this suits the source documents.
        Document document = new Document();
        using (var fs = new FileStream(outputPath, System.IO.FileMode.Create))
        using (var writer = PdfWriter.GetInstance(document, fs))
        {
            document.Open();
            PdfContentByte cb = writer.DirectContent;

            for (int pageNumber = pageFrom; pageNumber < endExclusive; pageNumber++)
            {
                document.NewPage();
                PdfImportedPage page = writer.GetImportedPage(reader, pageNumber);
                cb.AddTemplate(page, 0, 0);
            }

            // Close only after the whole range is copied; closing inside the loop
            // would cut the output off after its first page.
            document.Close();
        }
    }

Вы можете установить iTextSharp из NuGet, затем скопировать этот код в своё приложение на C#. Вызовите метод SplitPDFByBookMark() и передайте ему имя PDF-файла. Код найдёт закладки в документе и разделит его по ним.

Sanjeev Gaur · Answer 6 · 11 февраля 2013

Этот код основан на библиотеке PDFsharp

http://www.pdfsharp.com/PDFsharp/

Если вы хотите разделить по Book Mark, то вот код.

   /// <summary>
   /// Splits a PDF into one file per bookmark returned by
   /// <c>SimpleBookmark.GetBookmark</c>. Each output starts at its bookmark's page
   /// and ends just before the next bookmark's page (or at the last page), and is
   /// named after the bookmark title.
   /// </summary>
   /// <param name="fileName">Path of the PDF to split; outputs are written next to it.</param>
   /// <remarks>
   /// A document without bookmarks produces no output. Only the entries of the
   /// returned list are iterated, and each entry is expected to carry a "Page" value.
   /// </remarks>
   public static void SplitPDFByBookMark(string fileName)
    {
        PdfReader pdfReader = new PdfReader(fileName);
        try
        {
            IList<Dictionary<string, object>> bookmarks = SimpleBookmark.GetBookmark(pdfReader);
            if (bookmarks == null)
            {
                // The document has no outline, so there is nothing to split by.
                return;
            }

            for (int i = 0; i < bookmarks.Count; ++i)
            {
                // Use the i-th bookmark: reading index 0 here would make every output
                // start at the first bookmark's page.
                IDictionary<string, object> current = bookmarks[i];
                IDictionary<string, object> next = i == bookmarks.Count - 1 ? null : bookmarks[i + 1];

                // The "Page" value starts with the page number followed by a space.
                int startPage = int.Parse(current["Page"].ToString().Split(' ')[0]);
                int nextStartPage = next == null
                    ? pdfReader.NumberOfPages + 1
                    : int.Parse(next["Page"].ToString().Split(' ')[0]);

                // Look the title up by key instead of relying on dictionary ordering,
                // and replace characters that cannot appear in a file name.
                string title = current["Title"].ToString();
                foreach (char invalid in System.IO.Path.GetInvalidFileNameChars())
                {
                    title = title.Replace(invalid, '_');
                }

                SplitByBookmark(pdfReader, startPage, nextStartPage, title + ".pdf", fileName);
            }
        }
        finally
        {
            // Release the source file handle; exceptions propagate with their stack trace intact.
            pdfReader.Close();
        }
    }
    /// <summary>
    /// Copies the pages <paramref name="pageFrom"/> (inclusive) to <paramref name="PageTo"/>
    /// (exclusive) of <paramref name="reader"/> into a new PDF placed in the directory of
    /// <paramref name="inPutFileName"/>.
    /// </summary>
    /// <param name="reader">Open reader over the source document; not closed here.</param>
    /// <param name="pageFrom">1-based first page to copy.</param>
    /// <param name="PageTo">1-based page at which copying stops (exclusive).</param>
    /// <param name="outPutName">File name of the PDF to create.</param>
    /// <param name="inPutFileName">Path of the source PDF; only its directory part is used.</param>
    /// <remarks>
    /// When the range is empty (<paramref name="PageTo"/> is not greater than
    /// <paramref name="pageFrom"/>) the single page <paramref name="pageFrom"/> is written.
    /// </remarks>
    private static void SplitByBookmark(PdfReader reader, int pageFrom, int PageTo, string outPutName, string inPutFileName)
    {
        string directory = System.IO.Path.GetDirectoryName(inPutFileName) ?? string.Empty;
        string outputPath = System.IO.Path.Combine(directory, outPutName);

        // Always copy at least one page: two bookmarks can point at the same page.
        int endExclusive = PageTo > pageFrom ? PageTo : pageFrom + 1;

        // NOTE(review): pages are imported onto the Document's default page size and
        // without rotation handling — confirm this suits the source documents.
        Document document = new Document();
        using (FileStream fs = new System.IO.FileStream(outputPath, System.IO.FileMode.Create))
        {
            PdfWriter writer = PdfWriter.GetInstance(document, fs);
            document.Open();
            PdfContentByte cb = writer.DirectContent;

            for (int pageNumber = pageFrom; pageNumber < endExclusive; pageNumber++)
            {
                document.NewPage();
                PdfImportedPage page = writer.GetImportedPage(reader, pageNumber);
                cb.AddTemplate(page, 0, 0);
            }

            // Close only after the whole range is copied; closing inside the loop
            // would cut the output off after its first page. On failure the using
            // block still releases the file, and the original exception is not masked.
            document.Close();
        }

    }

разбить PDF на несколько файлов в C #

Пожалуйста, войдите или зарегистрируйтесь чтобы ответить на этот вопрос.

Ответы [ 6 ]

Пожалуйста, войдите или зарегистрируйтесь что бы добавить комментарий.

Пожалуйста, войдите или зарегистрируйтесь что бы добавить комментарий.

Пожалуйста, войдите или зарегистрируйтесь что бы добавить комментарий.

Пожалуйста, войдите или зарегистрируйтесь что бы добавить комментарий.

Пожалуйста, войдите или зарегистрируйтесь что бы добавить комментарий.

Пожалуйста, войдите или зарегистрируйтесь что бы добавить комментарий.

разбить PDF на несколько файлов в C #

Пожалуйста, войдите или зарегистрируйтесь чтобы ответить на этот вопрос.

Ответы [ 6 ]

Пожалуйста, войдите или зарегистрируйтесь что бы добавить комментарий.

Пожалуйста, войдите или зарегистрируйтесь что бы добавить комментарий.

Пожалуйста, войдите или зарегистрируйтесь что бы добавить комментарий.

Пожалуйста, войдите или зарегистрируйтесь что бы добавить комментарий.

Пожалуйста, войдите или зарегистрируйтесь что бы добавить комментарий.

Пожалуйста, войдите или зарегистрируйтесь что бы добавить комментарий.

Нет похожих вопросов