Springboot使用AOP结合Redis+Lua脚本分布式限流

1.定义一个限流注解，方便AOP调用#

1
@Target(ElementType.METHOD)
2
@Retention(RetentionPolicy.RUNTIME)
3
@Documented
4
public @interface RateLimiter {
5
    long DEFAULT_REQUEST = 10;
6

7
    /**
8
     * max 最大请求数
9
     */
10
    @AliasFor("max") long value() default DEFAULT_REQUEST;
11

12
    /**
13
     * max 最大请求数
14
     */
15
    @AliasFor("value") long max() default DEFAULT_REQUEST;
16
    //上方写两次是为了等值使用，添加了 AliasFor 必须通过 AnnotationUtils 获取，才会生效
17

18
    /**
19
     * 限流key
20
     */    String key() default "";
21

22
    /**
23
     * 超时时长，默认1分钟
24
     */
25
    long timeout() default 1;
26

27
    /**
28
     * 超时时间单位，默认 分钟
29
     */
30
    TimeUnit timeUnit() default TimeUnit.MINUTES;
31
}

2.切面类#

定义切点表达式，并创建环绕通知方法 pointcut：通过形参 point 拿到被拦截的方法后，使用 AnnotationUtils 获取该方法上的 RateLimiter 注解及其参数——最大访问次数 max、超时时间 timeout 以及时间单位 timeUnit。然后把这些参数交给限流方法，计算出窗口时间范围（expired 到 now），最后交给 Lua 脚本执行。

1
@Slf4j
2
@Aspect
3
@Component
4
@RequiredArgsConstructor()
5
public class RateLimiterAspect {
6
    private final static String SEPARATOR = ":";
7
    private final static String REDIS_LIMIT_KEY_PREFIX = "limit:";
8
    private final StringRedisTemplate stringRedisTemplate;
9
    private final RedisScript<Long> limitRedisScript;
10

11
    @Pointcut("@annotation(com.xkcoding.ratelimit.redis.annotation.RateLimiter)")
12
    public void rateLimit() {
13

14
    }
15

16
    @Around("rateLimit()")
17
    public Object pointcut(ProceedingJoinPoint point) throws Throwable {
18
        MethodSignature signature = (MethodSignature) point.getSignature();
19
        Method method = signature.getMethod();
20
        // 通过 AnnotationUtils.findAnnotation 获取 RateLimiter 注解
21
        RateLimiter rateLimiter = AnnotationUtils.findAnnotation(method, RateLimiter.class);
22
        if (rateLimiter != null) {
23
            String key = rateLimiter.key();
24
            // 默认用类名+方法名做限流的 key 前缀
25
            if (StrUtil.isBlank(key)) {
26
                key = method.getDeclaringClass().getName() + StrUtil.DOT + method.getName();
27
            }
28
            // 最终限流的 key 为 前缀 + IP地址
29
            // TODO: 此时需要考虑局域网多用户访问的情况，因此 key 后续需要加上方法参数更加合理 ，其实就是：当前限流 key 只包含了“自定义 key 或类名.方法名”和“IP 地址”，但在局域网环境下，多个用户可能共用同一个外网 IP，导致限流不够精确。为了解决这个问题，建议在 key 中加入方法参数（如用户 ID、请求参数等），这样可以更细粒度地区分不同用户或请求，避免误伤。
30
            key = key + SEPARATOR + IpUtil.getIpAddr();
31

32
            long max = rateLimiter.max();
33
            long timeout = rateLimiter.timeout();
34
            TimeUnit timeUnit = rateLimiter.timeUnit();
35
            boolean limited = shouldLimited(key, max, timeout, timeUnit);
36
            if (limited) {
37
                throw new RuntimeException("手速太快了，慢点儿吧~");
38
            }
39
        }
40

41
        return point.proceed();
42
    }
43

44
    private boolean shouldLimited(String key, long max, long timeout, TimeUnit timeUnit) {
45
        // 最终的 key 格式为：
46
        // limit:自定义key:IP
47
        // limit:类名.方法名:IP
48
        key = REDIS_LIMIT_KEY_PREFIX + key;
49
        // 统一使用单位毫秒
50
        long ttl = timeUnit.toMillis(timeout);
51
        // 当前时间毫秒数
52
        long now = Instant.now().toEpochMilli();
53
        long expired = now - ttl;
54
        // 注意这里必须转为 String,否则会报错 java.lang.Long cannot be cast to java.lang.String
55
      Long executeTimes = stringRedisTemplate.execute(limitRedisScript, Collections.singletonList(key), now + "", ttl + "", expired + "", max + "");
56
        if (executeTimes != null) {
57
            if (executeTimes == 0) {
58
                log.error("【{}】在单位时间 {} 毫秒内已达到访问上限，当前接口上限 {}", key, ttl, max);
59
                return true;
60
            } else {
61
                log.info("【{}】在单位时间 {} 毫秒内访问 {} 次", key, ttl, executeTimes);
62
                return false;
63
            }
64
        }
65
        return false;
66
    }
67
}

3.Lua脚本#

1
-- Sliding-window rate limit script.
-- KEYS[1]: zset key; ARGV: now, ttl, expired, max (see below).
-- Returns 0 when the limit is reached, otherwise the request count including this one.

-- Lua indexes start at 1
local key = KEYS[1]
local now = tonumber(ARGV[1])
local ttl = tonumber(ARGV[2])
local expired = tonumber(ARGV[3])
-- maximum number of requests
local max = tonumber(ARGV[4])

-- Remove stale entries:
-- drop every member whose score lies in [0, expired]; expired is the score that is already out of date,
-- i.e. current time in milliseconds minus the timeout in milliseconds
redis.call('zremrangebyscore', key, 0, expired)

-- number of entries currently in the zset
local current = tonumber(redis.call('zcard', key))
local next = current + 1

if next > max then
  -- limit reached: return 0
  return 0
else
  -- add an element whose value and score are both the current timestamp, [value, score]
  -- NOTE(review): zset members are unique, so two requests carrying the same `now` for the
  -- same key are stored as a single member and counted once.
  redis.call("zadd", key, now, now)
  -- reset the zset expiry on every accepted request, in milliseconds
  redis.call("pexpire", key, ttl)
  return next
end

脚本先获取参数，再用滑动窗口动态计算：首先删除不在窗口范围内的数据，然后用“窗口内已有请求数 + 当前这一次请求”与最大访问数 max 做比较。如果大于 max，说明当前时间窗口内的请求已超限，返回 0，本次请求不再放行；否则就把当前请求写入 zset，并重新设置 key 的过期时间（相当于把过期时间顺延一个 timeout）。重新设置过期时间是为了解决“僵尸 Key”问题，而不是“过期数据”问题：如果用户访问该接口一次后再也不访问，就不会再有请求触发 zremrangebyscore 去移除窗口外的元素，没有过期时间的 key 就会永久存在。设置过期时间可以确保即使用户再也不访问，相关的限流 key 也能在 timeout 后自动清理，避免 Redis 中累积大量无用的 key。顺带说一句，这些残留的 key 同样占用内存，Redis 也需要去维护。

4.其它#

为什么Redis数据结构要使用zset实现限流？#

使用 ZSET 的核心原因是要实现滑动时间窗口限流。

核心需求#

限流需要判断：在过去N秒内，是否已经有超过M次请求

ZSET 的优势#

1. 存储时间戳#

1
-- ZSET 同时存储时间戳作为 value 和 score
2
zadd key 1697788800000 1697788800000  -- [时间戳, 时间戳]

2. 高效清理过期数据#

1
-- 一条命令删除所有过期请求记录
2
redis.call('zremrangebyscore', key, 0, expired)

3. 快速统计当前请求数#

1
-- 直接获取有效请求数量
2
local current = redis.call('zcard', key)

对比其他方案#

- STRING 计数器：只能实现固定时间窗口，无法滑动
- LIST：清理过期数据效率低，需要逐个检查
- HASH：需要手动维护时间字段，复杂度高

实现效果#

1
窗口=60秒，限制=5次
2

3
时间轴: 10:00:00  10:00:30  10:01:00  10:01:10
4
请求:     ①②③      ④⑤       检查      ⑥
5

6
在 10:01:10 检查时：
7
├─ 删除 10:00:10 之前的请求 (①②③被删除)
8
├─ 保留 ④⑤ (在窗口内)
9
├─ 当前计数=2，允许⑥通过

ZSET 让滑动窗口限流变得简单高效，这是选择它的根本原因。

为什么要用lua脚本，而不是java代码实现#

使用 Lua 脚本而不是 Java 代码实现限流逻辑，主要有以下几个关键原因：

1. 保证操作的原子性#

需要说明的是：在 IP 级别的限流下，不同 IP 的 key 各不相同、互不干扰；但同一个 IP 的并发请求仍然会操作同一个 key，所以用多条 Java 命令实现时依然存在下面的竞态问题，只有把整段逻辑放进 Lua 脚本才能保证原子性。

Java 代码的问题（非原子性）：#

1
// ❌ 这些操作不是原子的，存在竞态条件
2
stringRedisTemplate.opsForZSet().removeRangeByScore(key, 0, expired);  // 操作1
3
Long current = stringRedisTemplate.opsForZSet().zCard(key);             // 操作2
4
if (current < max) {
5
    stringRedisTemplate.opsForZSet().add(key, now, now);                // 操作3
6
    stringRedisTemplate.expire(key, ttl, TimeUnit.MILLISECONDS);        // 操作4
7
}

并发问题示例：#

1
时间线：用户A 和 用户B 同时访问（当前计数=4，限制=5）
2

3
用户A：removeRangeByScore → current=4 → 判断通过 → [被中断]
4
用户B：removeRangeByScore → current=4 → 判断通过 → zadd → 计数=5
5
用户A：[继续] → zadd → 计数=6 ❌ 超出限制！

Lua 脚本的优势（原子性）：#

1
-- ✅ 整个脚本作为一个原子操作执行
2
redis.call('zremrangebyscore', key, 0, expired)
3
local current = tonumber(redis.call('zcard', key))
4
-- 中间不会被其他请求打断
5
redis.call("zadd", key, now, now)

2. 减少网络往返次数#

Java 代码：#

1
// ❌ 需要 3-4 次网络往返
2
stringRedisTemplate.opsForZSet().removeRangeByScore(key, 0, expired);  // 网络往返1
3
Long current = stringRedisTemplate.opsForZSet().zCard(key);             // 网络往返2
4
stringRedisTemplate.opsForZSet().add(key, now, now);                    // 网络往返3
5
stringRedisTemplate.expire(key, ttl, TimeUnit.MILLISECONDS);           // 网络往返4

Lua 脚本：#

1
-- ✅ 只需要 1 次网络往返
2
-- 所有操作在 Redis 服务器端执行

3. 性能优势#

高并发场景下的差异：#

1
1000个并发请求的情况：
2

3
Java 实现：
4
├─ 网络往返：1000 × 4 = 4000次
5
├─ 竞态条件：可能导致限流失效
6
└─ 响应时间：较慢
7

8
Lua 脚本：
9
├─ 网络往返：1000 × 1 = 1000次
10
├─ 原子操作：限流严格有效
11
└─ 响应时间：更快

4. 避免分布式锁#

如果用 Java 实现，需要加锁：#

1
// ❌ 复杂且性能差
2
String lockKey = "lock:" + key;
3
try {
4
    // 获取分布式锁
5
    if (redisLock.tryLock(lockKey, 100, TimeUnit.MILLISECONDS)) {
6
        // 执行限流逻辑
7
        // ...
8
    }
9
} finally {
10
    redisLock.unlock(lockKey);
11
}

Lua 脚本天然避免了这个问题：#

1
-- ✅ 不需要显式加锁，Redis 保证脚本原子执行

5. 事务一致性#

Lua 脚本确保限流判断和计数更新在同一个事务中：

1
-- 判断和操作是一体的，不会出现：
2
-- "判断时未超限，但执行时已超限" 的情况
3
if next > max then
4
  return 0;
5
else
6
  redis.call("zadd", key, now, now)
7
  return next
8
end

总结#

Lua 脚本的核心优势：

✅ 原子性：避免竞态条件
✅ 高性能：减少网络往返
✅ 简洁：无需分布式锁
✅ 准确性：严格的限流控制

优化：惩罚机制和风控策略#

当前的限流实现确实比较基础，只是简单地拒绝请求。在实际生产环境中，需要更完善的惩罚机制和风控策略。

当前实现的局限性#

1
// 当前逻辑：超出限制就直接抛异常
2
if (limited) {
3
    throw new RuntimeException("手速太快了，慢点儿吧~");
4
}

问题：

❌ 无惩罚机制：用户可以一直尝试
❌ 无封禁逻辑：恶意用户成本很低
❌ 无分级处理：所有超限都是同等处理

改进方案：分级惩罚机制#

1. 增强的注解定义#

1
/**
 * Rate-limit annotation extended with punishment (warning / ban) settings.
 */
@Target(ElementType.METHOD)
@Retention(RetentionPolicy.RUNTIME)
public @interface RateLimiter {
    // Existing attributes

    /** Maximum number of requests per window. */
    long max() default 5;

    /** Window length, expressed in {@link #timeUnit()}. */
    long timeout() default 1;

    /** Unit of {@link #timeout()}. */
    TimeUnit timeUnit() default TimeUnit.MINUTES;

    // New punishment attributes

    /** Whether punishment is enabled. */
    boolean enablePunishment() default false;

    /** Violation count at which a warning is issued. */
    long warningThreshold() default 10;

    /** Violation count at which the caller is banned. */
    long banThreshold() default 20;

    /** Ban length, expressed in {@link #banTimeUnit()}. */
    long banDuration() default 30;

    /** Unit of {@link #banDuration()}. */
    TimeUnit banTimeUnit() default TimeUnit.MINUTES;
}

2. 分级处理逻辑#

1
@Service
2
public class EnhancedRateLimiterService {
3

4
    private static final String VIOLATION_KEY_PREFIX = "violation:";
5
    private static final String BAN_KEY_PREFIX = "ban:";
6

7
    public RateLimitResult checkRateLimit(String key, RateLimiter config) {
8
        // 1. 检查是否被封禁
9
        if (isBanned(key)) {
10
            return RateLimitResult.banned("用户已被封禁");
11
        }
12

13
        // 2. 执行正常限流检查
14
        boolean normalLimited = executeNormalRateLimit(key, config);
15

16
        if (!normalLimited) {
17
            return RateLimitResult.allowed();
18
        }
19

20
        // 3. 记录违规次数
21
        long violationCount = recordViolation(key);
22

23
        // 4. 根据违规次数分级处理
24
        if (config.enablePunishment()) {
25
            return handleViolation(key, violationCount, config);
26
        }
27

28
        return RateLimitResult.rejected("请求过于频繁");
29
    }
30

31
    private RateLimitResult handleViolation(String key, long count, RateLimiter config) {
32
        if (count >= config.banThreshold()) {
33
            // 封禁用户
34
            banUser(key, config.banDuration(), config.banTimeUnit());
35
            return RateLimitResult.banned("违规次数过多，已被封禁 " +
36
                config.banDuration() + " " + config.banTimeUnit().name().toLowerCase());
37

38
        } else if (count >= config.warningThreshold()) {
39
            // 警告
40
            return RateLimitResult.warning("警告：继续违规将被封禁，当前违规次数：" + count);
41
        }
42

43
        return RateLimitResult.rejected("请求过于频繁，违规次数：" + count);
44
    }
45
}

3. Lua 脚本增强#

1
-- enhanced_rate_limit.lua
-- Sliding-window rate limit with violation counting and banning.
-- Returns a two-element array:
--   {-1, remaining}  caller is currently banned (remaining = ban_expire - now)
--   {n, 0}           request accepted, n = request count including this one
--   {-2, duration}   this violation triggered a ban
--   {0, violations}  request rejected, violations = current violation count
local key = KEYS[1]
local violation_key = KEYS[2]
local ban_key = KEYS[3]

local now = tonumber(ARGV[1])
local ttl = tonumber(ARGV[2])
local expired = tonumber(ARGV[3])
local max = tonumber(ARGV[4])
-- NOTE(review): ban_duration is treated as milliseconds (it is added to `now`) - confirm with the caller
local ban_duration = tonumber(ARGV[5])
local ban_threshold = tonumber(ARGV[6])

-- Is the caller banned?
local ban_expire = redis.call('GET', ban_key)
if ban_expire and tonumber(ban_expire) > now then
    return {-1, tonumber(ban_expire) - now} -- remaining ban time
end

-- Normal rate-limit logic
redis.call('zremrangebyscore', key, 0, expired)
local current = tonumber(redis.call('zcard', key))

if current < max then
    redis.call("zadd", key, now, now)
    redis.call("pexpire", key, ttl)
    return {current + 1, 0}
else
    -- Record the violation
    local violation_count = redis.call('INCR', violation_key)
    redis.call('EXPIRE', violation_key, 3600) -- violation record expires after 1 hour

    -- Ban when the threshold is reached
    if violation_count >= ban_threshold then
        redis.call('SET', ban_key, now + ban_duration)
        -- PEXPIRE takes milliseconds directly; dividing by 1000 for EXPIRE produced a
        -- non-integer whenever ban_duration was not a multiple of 1000.
        redis.call('PEXPIRE', ban_key, ban_duration)
        return {-2, ban_duration} -- ban triggered
    end

    return {0, violation_count} -- current violation count
end

4. 控制器中的使用#

1
@RestController
2
public class EnhancedTestController {
3

4
    @RateLimiter(
5
        max = 5,
6
        timeout = 1,
7
        timeUnit = TimeUnit.MINUTES,
8
        enablePunishment = true,
9
        warningThreshold = 3,
10
        banThreshold = 5,
11
        banDuration = 30,
12
        banTimeUnit = TimeUnit.MINUTES
13
    )
14
    @GetMapping("/test1")
15
    public ResponseEntity<Dict> test1() {
16
        return ResponseEntity.ok(
17
            Dict.create()
18
                .set("msg", "hello,world!")
19
                .set("description", "正常访问")
20
        );
21
    }
22
}

5. 结果类型定义#

1
@Data
2
@AllArgsConstructor
3
public class RateLimitResult {
4
    private boolean allowed;
5
    private String message;
6
    private long remainingTime; // 剩余封禁时间（秒）
7
    private int violationCount; // 违规次数
8

9
    public static RateLimitResult allowed() {
10
        return new RateLimitResult(true, "允许访问", 0, 0);
11
    }
12

13
    public static RateLimitResult banned(String message) {
14
        return new RateLimitResult(false, message, 0, 0);
15
    }
16

17
    public static RateLimitResult warning(String message) {
18
        return new RateLimitResult(true, message, 0, 0);
19
    }
20
}

效果展示#

1
用户访问轨迹：
2

3
第1-5次：正常返回数据
4
第6次：  "请求过于频繁，违规次数：1"
5
第7次：  "请求过于频繁，违规次数：2"
6
第8次：  "警告：继续违规将被封禁，当前违规次数：3"
7
第9次：  "警告：继续违规将被封禁，当前违规次数：4"
8
第10次： "违规次数过多，已被封禁 30 minutes"
9

10
接下来30分钟内的所有请求：
11
"用户已被封禁，剩余时间：XX分钟"

这样的机制能够：

✅ 递进式惩罚：从警告到封禁
✅ 震慑效果：增加恶意访问成本
✅ 保护系统：防止资源被滥用
✅ 用户体验：给正常用户提供清晰的反馈