XXS攻击，HTML代码注入

最新推荐文章于 2024-09-08 12:26:59 发布

郭优秀的笔记

最新推荐文章于 2024-09-08 12:26:59 发布

阅读量2.8k

点赞数 1

分类专栏： Java

本文链接：https://blog.csdn.net/guoYLong/article/details/88416310

版权

Java 专栏收录该内容

40 篇文章 1 订阅

订阅专栏

XSS, 即为（Cross Site Scripting）, 中文名为跨站脚本,XSS是一种经常出现在web应用中的计算机安全漏洞，它允许恶意web用户将代码植入到提供给其它用户使用的页面中。比如这些代码包括HTML代码和客户端脚本。攻击者利用XSS漏洞旁路掉访问控制——例如同源策略(same origin policy)。

针对现在很多企业级开发的同学，避免不了页面进行编辑，或者评论，或者是富文本编辑等操作，只要涉及到这些操作，就要防止非法入侵，下面可以分享一下自己在开发中遇到的这种情况，直接上工具类：

package com.***.****.admin.utils;

import java.util.regex.Matcher;
import java.util.regex.Pattern;

public class DelHtmlTagUtils {

    // 输入框的过滤
    public static String delHTMLTag(String htmlStr) {
        if (htmlStr != null && htmlStr.length() > 0) {
            String regExscript = "<script[^>]*?>[\\s\\S]*?<\\/script>"; // 定义script的正则表达式
            String regExstyle = "<style[^>]*?>[\\s\\S]*?<\\/style>"; // 定义style的正则表达式
            String regExHtml = "&lt;script.*?&gt;.*?&lt;/script&gt;"; // 定义转义后script标签的正则表达式
            String regExHtml1 = "&lt;script.*?&gt;"; // 定义转义后script标签的正则表达式
            String regExHtml2 = "&lt;/script&gt;"; // 定义转义后script标签的正则表达式
            String regExHtml3 = "script"; // 定义转义后script标签的正则表达式
            String regExHtml4 = "javascript";
            String regExHtml5 = "eval\\((.*)\\)";
            String regExHtml6 = "<[^>]+>";
            String regExHtml7 = "<>";
            String regExHtml8 = "src[\r\n]*=[\r\n]*\\\'(.*?)\\\'";
            String regExHtml10 = "&lt;[^>]*on.*?&gt;";
            String regExHtml11 = "&lt;/[^>]*on.*&gt;";
            String regExHtml13 = "<a[^>]*?>[\\s\\S]*?<\\/a>";
            String regExHtml14 = "<iframe[^>]*?>[\\s\\S]*?<\\/iframe>";
            String regExHtml15 = "&lt;a.*?&gt;.*?&lt;/a&gt;"; // 定义转义后script标签的正则表达式
            String regExHtml16 = "&lt;iframe.*?&gt;.*?&lt;/iframe&gt;";

            Pattern pScript = Pattern.compile(regExscript, Pattern.CASE_INSENSITIVE);
            Matcher mScript = pScript.matcher(htmlStr);
            htmlStr = mScript.replaceAll(""); // 过滤

            Pattern pStyle = Pattern.compile(regExstyle, Pattern.CASE_INSENSITIVE);
            Matcher mStyle = pStyle.matcher(htmlStr);
            htmlStr = mStyle.replaceAll(""); // 过滤style标签

            Pattern pHtml = Pattern.compile(regExHtml, Pattern.CASE_INSENSITIVE);
            Matcher mHtml = pHtml.matcher(htmlStr);
            htmlStr = mHtml.replaceAll(""); // 过滤转义后script标签

            Pattern pHtml1 = Pattern.compile(regExHtml1, Pattern.CASE_INSENSITIVE);
            Matcher mHtml1 = pHtml1.matcher(htmlStr);
            htmlStr = mHtml1.replaceAll(""); // 过滤转义后script标签

            Pattern pHtml2 = Pattern.compile(regExHtml2, Pattern.CASE_INSENSITIVE);
            Matcher mHtml2 = pHtml2.matcher(htmlStr);
            htmlStr = mHtml2.replaceAll(""); // 过滤转义后script标签

            Pattern pHtml3 = Pattern.compile(regExHtml3, Pattern.CASE_INSENSITIVE);
            Matcher mHtml3 = pHtml3.matcher(htmlStr);
            htmlStr = mHtml3.replaceAll(""); // 过滤script标签

            Pattern pHtml4 = Pattern.compile(regExHtml4, Pattern.CASE_INSENSITIVE);
            Matcher mHtml4 = pHtml4.matcher(htmlStr);
            htmlStr = mHtml4.replaceAll(""); // 过滤javascript标签

            Pattern pHtml5 = Pattern.compile(regExHtml5, Pattern.CASE_INSENSITIVE);
            Matcher mHtml5 = pHtml5.matcher(htmlStr);
            htmlStr = mHtml5.replaceAll(""); // 过滤eval标签

            Pattern pHtml6 = Pattern.compile(regExHtml6, Pattern.CASE_INSENSITIVE);
            Matcher mHtml6 = pHtml6.matcher(htmlStr);
            htmlStr = mHtml6.replaceAll(""); // 过滤html标签

            Pattern pHtml7 = Pattern.compile(regExHtml7, Pattern.CASE_INSENSITIVE);
            Matcher mHtml7 = pHtml7.matcher(htmlStr);
            htmlStr = mHtml7.replaceAll(""); // 过滤html标签

            Pattern pHtml8 = Pattern.compile(regExHtml8, Pattern.CASE_INSENSITIVE);
            Matcher mHtml8 = pHtml8.matcher(htmlStr);
            htmlStr = mHtml8.replaceAll(""); // 过滤html标签

            Pattern pHtml10 = Pattern.compile(regExHtml10, Pattern.CASE_INSENSITIVE);
            Matcher mHtml10 = pHtml10.matcher(htmlStr);
            htmlStr = mHtml10.replaceAll("");

            Pattern pHtml11 = Pattern.compile(regExHtml11, Pattern.CASE_INSENSITIVE);
            Matcher mHtml11 = pHtml11.matcher(htmlStr);
            htmlStr = mHtml11.replaceAll("");

            Pattern pHtml13 = Pattern.compile(regExHtml13, Pattern.CASE_INSENSITIVE);
            Matcher mHtml13 = pHtml13.matcher(htmlStr);
            htmlStr = mHtml13.replaceAll("");

            Pattern pHtml14 = Pattern.compile(regExHtml14, Pattern.CASE_INSENSITIVE);
            Matcher mHtml14 = pHtml14.matcher(htmlStr);
            htmlStr = mHtml14.replaceAll("");

            Pattern pHtml15 = Pattern.compile(regExHtml15, Pattern.CASE_INSENSITIVE);
            Matcher mHtml15 = pHtml15.matcher(htmlStr);
            htmlStr = mHtml15.replaceAll("");

            Pattern pHtml16 = Pattern.compile(regExHtml16, Pattern.CASE_INSENSITIVE);
            Matcher mHtml16 = pHtml16.matcher(htmlStr);
            htmlStr = mHtml16.replaceAll("");

            return htmlStr.trim(); // 返回文本字符串
        } else {
            return htmlStr;
        }
    }
}

上面是一个我写的一个工具类，直接调用在前端输入框可以过滤掉工具类中有写的js，script标签等

下面的是HTML过滤，具体根据你们自己的业务需求去更改

package ***.***.***.util;

import java.util.regex.Matcher;
import java.util.regex.Pattern;


public class HTMLUtils {

/**
 * 过滤所有HTML 标签
 * @param htmlStr
 * @return
 */
public static String filterHTMLTag(String htmlStr) {


    //定义HTML标签的正则表达式 
    String reg_html="<[^>]+>"; 
    Pattern pattern=Pattern.compile(reg_html,Pattern.CASE_INSENSITIVE); 
    Matcher matcher=pattern.matcher(htmlStr); 
    htmlStr=matcher.replaceAll(""); //过滤html标签 
    return htmlStr;
}

/**
 * 过滤标签，通过标签名
 * @param htmlStr
 * @param tagName
 * @return
 */
public static String filterTagByName(String htmlStr,String tagName) {

    String reg_html="<"+tagName+"[^>]*?>[\\s\\S]*?<\\/"+tagName+">";
    Pattern pattern=Pattern.compile(reg_html,Pattern.CASE_INSENSITIVE); 
    Matcher matcher=pattern.matcher(htmlStr); 
    htmlStr=matcher.replaceAll(""); //过滤html标签 
    return htmlStr;
}

/**
 * 过滤标签上的 style 样式
 * @param htmlStr
 * @return
 */
public static String filterHTMLTagInStyle(String htmlStr) {
    String reg_html="style=('|\")(.*?)('|\")";
    Pattern pattern=Pattern.compile(reg_html,Pattern.CASE_INSENSITIVE); 
    Matcher matcher=pattern.matcher(htmlStr); 
    htmlStr=matcher.replaceAll(""); //过滤html标签 
    return htmlStr;
}

/**
 * 替换表情
 * @param htmlStr
 * @param tagName
 * @return
 */
public static String replayFace(String htmlStr) {
    String reg_html="\\[em_\\d{1,}\\]";
    Pattern pattern =Pattern.compile(reg_html,Pattern.CASE_INSENSITIVE); 
    Matcher matcher=pattern.matcher(htmlStr);
    if(matcher.find()) {
        matcher.reset();
        while(matcher.find()) {
            String num = matcher.group(0);
            String number=num.substring(num.lastIndexOf('_')+1, num.length()-1);
            htmlStr = htmlStr.replace(num, "<img src='/face/arclist/"+number+".gif' border='0' />");
        }
    }
    return htmlStr;
}

    public static void main(String[] args) {
        String html = "<script>alert('test');</script><img src='/face/arclist/5.gif' border='0' /><div style='position:fixs;s'></div><style>body{color:#fff;}</style><Style>body{color:#fff;}</Style><STYLE>body{color:#fff;}</STYLE>";
        System.out.println("html="+html);
        html = HTMLUtils.filterTagByName(html, "style");
        System.out.println("html="+html);
        html = HTMLUtils.filterTagByName(html, "script");
        System.out.println("html="+html);
        html = HTMLUtils.filterHTMLTagInStyle(html);
        System.out.println("html="+html);
    }

}