开发记录5

完成了关键字的提取,自动分类,内容的查重,下面就是对生成PDF格式的检测报告

代码如下:

package com.servlet;

import java.awt.Color;
import java.io.FileOutputStream;
import java.text.DecimalFormat;
import java.util.Arrays;
import java.util.HashSet;
import java.util.List;

import com.dao.InformationDao;
import com.lowagie.text.Chapter;
import com.lowagie.text.Chunk;
import com.lowagie.text.Document;
import com.lowagie.text.Font;
import com.lowagie.text.PageSize;
import com.lowagie.text.Paragraph;
import com.lowagie.text.Phrase;
import com.lowagie.text.pdf.BaseFont;
import com.lowagie.text.pdf.PdfWriter;
import com.model.Information;

public class WriteFile {
    private static int normal = Font.NORMAL; // 正常字体
    private static Color black = new Color(0, 0, 0); // 黑色
    private static Color red = new Color(255, 0, 0); // 红色
    private int bold = Font.BOLD; // 粗体
    private Color blue = new Color(0, 0, 255); // 蓝色
    private float setting = 20; // 首行缩进参数
    static int count=0;//用红色标注的字体个数
    static int cop_count=0;//用红色标注的片段个数
    static int sum=0;//总字数

    public static void main(String[] args) throws Exception {
        WriteFile pdfDemo = new WriteFile();
        pdfDemo.writePdf("E:\20163587_姚雅丽\大型数据库技术与应用\信息技术手册检测报告.pdf");
        System.out.println("写入完成!");
    }
    public void write() throws Exception {
        WriteFile pdfDemo = new WriteFile();
        pdfDemo.writePdf("E:\20163587_姚雅丽\大型数据库技术与应用\信息技术手册检测报告.pdf");
        System.out.println("写入完成!");
    }
    /*
    public void writeone(String title,int index) throws Exception {
        WriteFile pdfDemo = new WriteFile();
        pdfDemo.writePdfone("E:\20163587_姚雅丽\大型数据库技术与应用\"+title+"信息技术手册检测报告.pdf",title,index);
        System.out.println("写入完成!");
    }*/
    public static Document createDoc(String filename) throws Exception {

        Document document = new Document(PageSize.A4, 50, 50, 50, 50);
        PdfWriter.getInstance(document, new FileOutputStream(filename));
        return document;
    }

    public void writePdf(String filename) throws Exception {
        InformationDao indao=new InformationDao();
        List<String> copys=indao.loadCopyAll();
        HashSet h = new HashSet(copys);
        copys.clear();
        copys.addAll(h);
        int length=0;
        int pianduan=0;
        for(String copy:copys)
        {
            length+=copy.length();
            pianduan++;
        }
        int sum2=0;
        List<Information> infoss=indao.loadAll();
        for (Information info : infoss) {
            sum2+=info.getContent().length();
        }
        Document document = createDoc(filename); // 打开文档
        document.open(); // 文档里写入
        Chunk chunk1 = new Chunk(convertChunkToChinese("信息技术手册检测报告", 20, bold, black));
        document.add(chunk1);
        document.add(new Paragraph("
"));
        Paragraph pp = new Paragraph(convertParToChinese("检测范围:◎百度词条", 9, normal, black));
        document.add(pp);
        Paragraph pp1 = new Paragraph(convertParToChinese("颜色标注说", 9, normal, black));
        document.add(pp1);
        Paragraph pp2 = new Paragraph();
        pp2.add(new Phrase(convertParToChinese("口", 9, normal, red)));
        pp2.add(new Phrase(convertParToChinese(":复写片段(相似或疑似重)", 9, normal, black)));
        document.add(pp2);
        //InformationDao indao=new InformationDao();
        document.add(new Paragraph(convertParToChinese("检测结论:",22, normal, black)));
        Paragraph a1=new Paragraph();
        a1.add(new Phrase(convertParToChinese("全文相似度:", 9, normal, black)));
        sum();
        DecimalFormat decimalFormat=new DecimalFormat(".00");//构造方法的字符格式这里如果小数不足2位,会以0补足.
        String p=decimalFormat.format((float)100*length/sum2);
        System.out.println(p);
        a1.add(new Phrase(convertParToChinese(p+"%", 9, normal, red)));
        document.add(a1);
        document.add(new Paragraph(convertParToChinese("总相似片段:" +pianduan, 9, normal, black)));
        List<Information> infos=indao.loadAll();
        for (Information info : infos) {
            Paragraph chapterTitle = new Paragraph("

");
            Paragraph p0 = new Paragraph(convertParToChinese(info.getIndex() + "." + info.getTitle(), 14, bold, black));
            chapterTitle.add(p0);
            Paragraph p3 = new Paragraph(convertParToChinese("类别:" + info.getType(), 9, normal, blue));
            chapterTitle.add(p3);
            //Paragraph p = new Paragraph(convertParToChinese("摘要:" + , 9, normal, blue));
            //chapterTitle.add(p);
            Paragraph p1 = new Paragraph(convertParToChinese("关键词:" + info.getKeyword(), 9, normal, blue));
            chapterTitle.add(p1);
            Paragraph p2 = returnCopy(info.getIndex(), info.getContent());// 解释
            chapterTitle.add(p2);
            document.add(chapterTitle);
        }
        document.add(new Paragraph("

"));
        
        document.close();
        count=0;
        sum=0;
        cop_count=0;
    }
    /*
    public void writePdfone(String filename,String title,int index) throws Exception {
        
        
        Document document = createDoc(filename); // 打开文档
        document.open(); // 文档里写入
        Chunk chunk1 = new Chunk(convertChunkToChinese(title+"信息技术手册检测报告", 20, bold, black));
        document.add(chunk1);
        document.add(new Paragraph("
"));
        Paragraph pp = new Paragraph(convertParToChinese("检测范围:◎百度词条", 9, normal, black));
        document.add(pp);
        Paragraph pp1 = new Paragraph(convertParToChinese("颜色标注说", 9, normal, black));
        document.add(pp1);
        Paragraph pp2 = new Paragraph();
        pp2.add(new Phrase(convertParToChinese("口", 9, normal, red)));
        pp2.add(new Phrase(convertParToChinese(":复写片段(相似或疑似重)", 9, normal, black)));
        document.add(pp2);
        InformationDao indao=new InformationDao();
        Information info=indao.load(index);
            Paragraph chapterTitle = new Paragraph("

");
            Paragraph p0 = new Paragraph(convertParToChinese(info.getIndex() + "." + info.getTitle(), 14, bold, black));
            chapterTitle.add(p0);
            Paragraph p3 = new Paragraph(convertParToChinese("类别:" + info.getType(), 9, normal, blue));
            chapterTitle.add(p3);
            //Paragraph p = new Paragraph(convertParToChinese("摘要:" + , 9, normal, blue));
            //chapterTitle.add(p);
            Paragraph p1 = new Paragraph(convertParToChinese("关键词:" + info.getKeyword(), 9, normal, blue));
            chapterTitle.add(p1);
            Paragraph p2 = returnExpain(info.getIndex(), info.getContent());// 解释
            chapterTitle.add(p2);
            document.add(chapterTitle);
        document.add(new Paragraph("

"));
        document.add(new Paragraph(convertParToChinese("检测结论:",22, normal, black)));
        Paragraph a1=new Paragraph();
        a1.add(new Phrase(convertParToChinese("全文相似度:", 9, normal, black)));
        sum();
        DecimalFormat decimalFormat=new DecimalFormat(".00");//构造方法的字符格式这里如果小数不足2位,会以0补足.
        String p=decimalFormat.format((float)100*count/sum);
        System.out.println(p);
        a1.add(new Phrase(convertParToChinese(p+"%", 9, normal, red)));
        document.add(a1);
        document.add(new Paragraph(convertParToChinese("总相似片段:" +cop_count, 9, normal, black)));
        count=0;
        sum=0;
        cop_count=0;
        document.close();
    }
    */
    //返回词语解释部分
    public static Paragraph returnCopy(int index, String explain) throws Exception
    {
        int chaoxi=0;//抄袭字数
        int pianduan=0;//抄袭片段
        int zongzishu=0;//总字数
        Paragraph a = new Paragraph();
        InformationDao indao=new InformationDao();
        List<String> copys=indao.loadCopy(index);
        HashSet h = new HashSet(copys);
        copys.clear();
        copys.addAll(h);
        System.out.println(copys);
        int pos[]=new int[100];
        int x=0;
        for(String copy:copys)
        {
            pos[x]=explain.indexOf(copy);
            x++;    
        }
        Arrays.sort(pos);
        
        for(int i=0;i<explain.length();i++)
        {
            String word="";
            //word = word+explain.charAt(i);
            //a.add(new Phrase(convertParToChinese2(word, 12, normal, black)));
            int max=0;
            boolean b=true;
            
            for(int position:pos)
            {
                if(i==position)//判断是否到达抄袭点
                {
                    b=false;//到达抄袭点
                }
            }
            if(b==false)
            {
                String cop="";
                for(String copy:copys)
                {
                    if(explain.indexOf(copy)==i)
                    {
                        cop=copy;
                    }
                }
                a.add(new Phrase(convertParToChinese2(cop, 12, normal, red)));
                chaoxi+=cop.length();
                pianduan++;
                i=i+cop.length();
            }
            word = word+explain.charAt(i);
            a.add(new Phrase(convertParToChinese2(word, 12, normal, black)));
            
        }
        a.add(new Paragraph(convertParToChinese("检测结论:",22, normal, black)));
        Paragraph a1=new Paragraph();
        a1.add(new Phrase(convertParToChinese("全文相似度:", 9, normal, black)));
        sum();
        DecimalFormat decimalFormat=new DecimalFormat(".00");//构造方法的字符格式这里如果小数不足2位,会以0补足.
        String p=decimalFormat.format((float)100*chaoxi/explain.length());
        System.out.println(p);
        a1.add(new Phrase(convertParToChinese(p+"%", 9, normal, red)));
        a.add(a1);
        a.add(new Paragraph(convertParToChinese("总相似片段:" +pianduan, 9, normal, black)));
        return a;
        
    }
    /*
    public static Paragraph returnExpain(int index, String explain) throws Exception {
        InformationDao indao=new InformationDao();
        String copy=indao.loadcpoy(index);
        String[]copys=copy.split("¢");
        Paragraph a = new Paragraph();
        String word = "";
        int j = 0;
        if (copy.length()!=0) 
        {
            if(copys.length==1)
            {
                String c = copys[j];
                //j++;
                //System.out.println(index);
                for (int i = 0; i < explain.length(); i++) 
                { 
                    int position=explain.indexOf(copys[0]);

                    if (i < position) 
                    {
                        //System.out.println("姚雅丽");
                        word = word + explain.charAt(i);
                        //System.out.println(word);
                        
                    } 
                    else if (i==position) 
                    {
                            System.out.println(word);
                            a.add(new Phrase(convertParToChinese2(word, 12, normal, black)));
                            a.add(new Phrase(convertParToChinese2(copys[0], 12, normal, red)));
                            count+=copys[0].length();
                            cop_count++;
                            word = "";
                    }
                    else if(i>=position+copys[0].length())
                    {
                        word = word + explain.charAt(i);
                        a.add(new Phrase(convertParToChinese2(word, 12, normal, black)));
                        word = "";
                    }
                }
            }
            else
            {
            String c = copys[j];
            //j++;
            //System.out.println(index);
            for (int i = 0; i < explain.length(); i++) 
            { 
                int position=explain.indexOf(copys[0]);
                int pos2=explain.indexOf(copys[1]);
                int min=0;
                int max=0;
                String one="";
                String two="";
                if(position<pos2)
                {
                    min=position;
                    one=copys[0];
                    two=copys[1];
                    max=pos2;
                }
                else
                {
                    max=position;
                    min=pos2;
                    two=copys[0];
                    one=copys[1];
                }
                if (i < min) 
                {
                    //System.out.println("姚雅");
                    word = word + explain.charAt(i);
                    
                } 
                else if (i==min) 
                {
                        a.add(new Phrase(convertParToChinese2(word, 12, normal, black)));
                        a.add(new Phrase(convertParToChinese2(one, 12, normal, red)));
                        cop_count++;
                        count+=one.length();
                        word = "";
                }
                else if (min+one.length()<=i&&i<max) 
                {
                        word = word + explain.charAt(i);
                        a.add(new Phrase(convertParToChinese2(word, 12, normal, black)));
                        word = "";
                    
                }else if(i==max)
                {
                     word = word + explain.charAt(i);
                     a.add(new Phrase(convertParToChinese2(two, 12, normal, red)));
                     cop_count++;
                     count+=two.length();
                     word = "";
                }
                else if(i>=max+two.length()&&i<explain.length()-1)
                {
                    word = word + explain.charAt(i);
                }
                else if(i==explain.length()-1)
                {
                    word = word + explain.charAt(i);
                    a.add(new Phrase(convertParToChinese2(word, 12, normal, black)));
                }

            }
            }
        } 
        else 
        {
            //System.out.println("姚雅丽");
            a = new Paragraph(convertParToChinese(explain, 12, normal, black));
        }
        return a;

    }
    */
    public static void sum() {
        InformationDao indao=new InformationDao();
        List<Information> infos=indao.loadAll();
        for(Information info:infos) {
            sum=sum+info.getContent().length();
        }
        
    }
    
    public static Paragraph convertParToChinese(String text, int fontsize, int fontStyle, Color color)
            throws Exception {
        BaseFont baseFontChinese = BaseFont.createFont("STSong-Light", "UniGB-UCS2-H", BaseFont.NOT_EMBEDDED);
        Font fontChinese = new Font(baseFontChinese, fontsize, fontStyle, color);
        Paragraph graph = new Paragraph(text, fontChinese);
        return graph;
    }

    public static Phrase convertParToChinese2(String text, int fontsize, int fontStyle, Color color) throws Exception {
        BaseFont baseFontChinese = BaseFont.createFont("STSong-Light", "UniGB-UCS2-H", BaseFont.NOT_EMBEDDED);
        Font fontChinese = new Font(baseFontChinese, fontsize, fontStyle, color);
        Phrase graph = new Phrase(text, fontChinese);
        return graph;
    }

    public static Chunk convertChunkToChinese(String text, int fontsize, int fontStyle, Color color) throws Exception {
        BaseFont baseFontChinese = BaseFont.createFont("STSong-Light", "UniGB-UCS2-H", BaseFont.NOT_EMBEDDED);
        Font fontChinese = new Font(baseFontChinese, fontsize, fontStyle, color);
        Chunk graph = new Chunk(text, fontChinese);
        return graph;
    }
}

参考文章:https://home.cnblogs.com/u/wl2017/