Python发生IndexError错误如何解决？

Python运行代码发生异常: IndexError如何解决？

list index out of range
  File "D:\ai2.py", line 21, in get_cat1_songlist_last_page
    last_page_url = "https://music.163.com" + all_pages_urls[-1].split('"')[1]
  File "D:\ai2.py", line 53, in find_cat1_cat2_songlist
    url, num = get_cat1_songlist_last_page(cat1)
  File "D:\ai2.py", line 127, in <module>
    url = find_cat1_cat2_songlist("华语", "新歌")
IndexError: list index out of range

代码如下
```python
import re
import requests
import json
import openpyxl
from openpyxl.drawing.image import Image
wb = openpyxl.Workbook()
sheet = wb.active

def get_cat1_songlist_last_page(cat1: str):
    url = 'https://music.163.com/discover/playlist/?cat=' + cat1
    headers = {
'Cookie': '__e_=1515461191756; _ntes_nnid=af802a7dd2cafc9fef605185da6e73fb,1515461190617; _ntes_nuid=af802a7dd2cafc9fef605185da6e73fb;JSESSIONID-WYYY=HMyeRdf98eDm%2Bi%5CRnK9iB%5ChcSODhA%2Bh4jx5t3z20hhwTRsOCWhBS5Cpn%2B5j%5CVfMIu0i4bQY9sky%5CsvMmHhuwud2cDNbFRD%2FHhWHE61VhovnFrKWXfDAp%5CqO%2B6cEc%2B%2BIXGz83mwrGS78Goo%2BWgsyJb37Oaqr0IehSp288xn5DhgC3Cobe%3A1515585307035; _iuqxldmzr_=32; __utma=94650624.61181594.1515583507.1515583507.1515583507.1; __utmc=94650624; __utmz=94650624.1515583507.1.1.utmcsr=(direct)|utmccn=(direct)|utmcmd=(none); __utmb=94650624.4.10.1515583507',
'Host': 'music.163.com',
'Referer': 'http://music.163.com/',
'Upgrade-Insecure-Requests': '1',
'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko)Chrome/63.0.3239.132 Safari/537.36' }
    r = requests.get(url, headers=headers)
    # reg1 = r'<ul class="f-hide"><li><a href="/song\?id=\d*?">.*</a></li></ul>'
    reg1 = r'<a href=".*" class="zpgi">\d*?</a>'
    all_pages_urls = re.compile(reg1).findall(r.text)
    last_page_url = "https://music.163.com" + all_pages_urls[-1].split('"')[1]
    last_page_number = int(all_pages_urls[-1].split('>')[1].split('<')[0])
    return last_page_url, last_page_number


def get_page_songlist_ids(url: str):
    headers = {
'Cookie': '__e_=1515461191756; _ntes_nnid=af802a7dd2cafc9fef605185da6e73fb,1515461190617; _ntes_nuid=af802a7dd2cafc9fef605185da6e73fb;JSESSIONID-WYYY=HMyeRdf98eDm%2Bi%5CRnK9iB%5ChcSODhA%2Bh4jx5t3z20hhwTRsOCWhBS5Cpn%2B5j%5CVfMIu0i4bQY9sky%5CsvMmHhuwud2cDNbFRD%2FHhWHE61VhovnFrKWXfDAp%5CqO%2B6cEc%2B%2BIXGz83mwrGS78Goo%2BWgsyJb37Oaqr0IehSp288xn5DhgC3Cobe%3A1515585307035; _iuqxldmzr_=32; __utma=94650624.61181594.1515583507.1515583507.1515583507.1; __utmc=94650624; __utmz=94650624.1515583507.1.1.utmcsr=(direct)|utmccn=(direct)|utmcmd=(none); __utmb=94650624.4.10.1515583507',
'Host': 'music.163.com',
'Referer': 'http://music.163.com/',
'Upgrade-Insecure-Requests': '1',
'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko)Chrome/63.0.3239.132 Safari/537.36' }
    r = requests.get(url, headers=headers)
    reg1 = r'<a title="(.*)" href="/playlist\?id=(\d*?)" class="msk"></a>'
    songlists = re.compile(reg1).findall(r.text)
    songlists_ids = [i[1] for i in songlists]
    reg2 = r'<a href="(.*?)" class="zbtn zprv">上一页</a>'
    nxt_page = re.compile(reg2).findall(r.text)
    return songlists_ids, "https://music.163.com" + nxt_page[0]
def get_songlist_tags(url: str):
    headers = {
'Cookie': '__e_=1515461191756; _ntes_nnid=af802a7dd2cafc9fef605185da6e73fb,1515461190617; _ntes_nuid=af802a7dd2cafc9fef605185da6e73fb;JSESSIONID-WYYY=HMyeRdf98eDm%2Bi%5CRnK9iB%5ChcSODhA%2Bh4jx5t3z20hhwTRsOCWhBS5Cpn%2B5j%5CVfMIu0i4bQY9sky%5CsvMmHhuwud2cDNbFRD%2FHhWHE61VhovnFrKWXfDAp%5CqO%2B6cEc%2B%2BIXGz83mwrGS78Goo%2BWgsyJb37Oaqr0IehSp288xn5DhgC3Cobe%3A1515585307035; _iuqxldmzr_=32; __utma=94650624.61181594.1515583507.1515583507.1515583507.1; __utmc=94650624; __utmz=94650624.1515583507.1.1.utmcsr=(direct)|utmccn=(direct)|utmcmd=(none); __utmb=94650624.4.10.1515583507',
'Host': 'music.163.com',
'Referer': 'http://music.163.com/',
'Upgrade-Insecure-Requests': '1',
'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko)Chrome/63.0.3239.132 Safari/537.36' }
    r = requests.get(url, headers=headers)
    reg1 = r'<a class="u-tag" href="/discover/playlist/\?cat=.*"><i>(.*)</i></a>'
    tags = re.compile(reg1).findall(r.text)
    return tags
def find_cat1_cat2_songlist(cat1: str, cat2: str, limit = 1000):
    total = 0
    url, num = get_cat1_songlist_last_page(cat1)
    for i in range(num):
          lists, nxt_page_url = get_page_songlist_ids(url)
          url = nxt_page_url
          cnt = 1
          print("正在搜索第", num, "页", "总共", len(lists), "个歌单")
          for id in lists:
               tags = get_songlist_tags("https://music.163.com/playlist?id=" + str(id))
               print(" 第%2d 个歌单标签为"%(cnt), str(tags), "url = ", "https://music.163.com/playlist?id=" + str(id))
               cnt += 1
               total += 1
               if(cat2 in tags):
                  return "https://music.163.com/playlist?id=" + str(id)
          num -= 1
    
def get_all_hotsongs(url: str):
    headers = {
'Cookie': '__e_=1515461191756; _ntes_nnid=af802a7dd2cafc9fef605185da6e73fb,1515461190617; _ntes_nuid=af802a7dd2cafc9fef605185da6e73fb;JSESSIONID-WYYY=HMyeRdf98eDm%2Bi%5CRnK9iB%5ChcSODhA%2Bh4jx5t3z20hhwTRsOCWhBS5Cpn%2B5j%5CVfMIu0i4bQY9sky%5CsvMmHhuwud2cDNbFRD%2FHhWHE61VhovnFrKWXfDAp%5CqO%2B6cEc%2B%2BIXGz83mwrGS78Goo%2BWgsyJb37Oaqr0IehSp288xn5DhgC3Cobe%3A1515585307035; _iuqxldmzr_=32; __utma=94650624.61181594.1515583507.1515583507.1515583507.1; __utmc=94650624; __utmz=94650624.1515583507.1.1.utmcsr=(direct)|utmccn=(direct)|utmcmd=(none); __utmb=94650624.4.10.1515583507',
'Host': 'music.163.com',
'Referer': 'http://music.163.com/',
'Upgrade-Insecure-Requests': '1',
'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko)Chrome/63.0.3239.132 Safari/537.36' }
    r = requests.get(url, headers=headers)
    reg1 = r'<ul class="f-hide"><li><a href="/song\?id=\d*?">.*</a></li></ul>'
    result_contain_songs_ul = re.compile(reg1).findall(r.text)
    result_contain_songs_ul = result_contain_songs_ul[0]
    reg2 = r'<li><a href="/song\?id=\d*?">(.*?)</a></li>'
    reg3 = r'<li><a href="/song\?id=(\d*?)">.*?</a></li>'
    hot_songs_name = re.compile(reg2).findall(result_contain_songs_ul)
    hot_songs_id = re.compile(reg3).findall(result_contain_songs_ul)
    return hot_songs_name, hot_songs_id
def get_avatar(url, path):
    headers = { "Accept": "text/html,application/xhtml+xml,application/xml;q=0.9,image/avif,image/webp,image/apng,*/*;q=0.8,application/signed-exchange;v=b3;q=0.7", "Accept-Encoding": "gzip, deflate", "Accept-Language": "zh-CN,zh;q=0.9,en;q=0.8,en-GB;q=0.7,en-US;q=0.6", "Cache-Control": "no-cache", "Connection": "keep-alive", "Host": "p1.music.126.net", "Pragma": "no-cache", "Upgrade-Insecure-Requests": "1", "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko)Chrome/125.0.0.0 Safari/537.36 Edg/125.0.0.0"
}
    r = requests.get(url, headers=headers)
    with open(path, "wb") as f:
         f.write(r.content)
def get_hotcommnets(hot_songs_name, hot_songs_id):
    url = 'http://music.163.com/weapi/v1/resource/comments/R_SO_4_' + hot_songs_id + '?csrf_token='
    headers = {
'Host': 'music.163.com',
'Proxy-Connection': 'keep-alive',
'Origin': 'http://music.163.com',
'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko)',
'Content-Type': 'application/x-www-form-urlencoded',
'Accept': '*/*',
'Referer': 'http://music.163.com/song?id=' + hot_songs_id + '',
'Accept-Encoding': 'gzip, deflate',
'Accept-Language': 'zh,zh-TW;q=0.9,en-US;q=0.8,en;q=0.7',
'Cookie': '__e_=1515461191756; _ntes_nnid=af802a7dd2cafc9fef605185da6e73fb,1515461190617; _ntes_nuid=af802a7dd2cafc9fef605185da6e73fb; _iuqxldmzr_=32; __utmc=94650624; __utmz=94650624.1515628584.2.2.utmcsr=baidu|utmccn=(organic)|utmcmd=organic;JSESSIONID-WYYY=TO%2BtUvrTWONNwB%2BgzDpfjFDiggKiS%2FfpMYNam%2BWGooHNka%2BwMhdsT%5CY%2Fn%2FpSMJwo4skFIK1T%2FNjd95lbGHWMQr5d5qcMRPB9SVKWK8UuBs1OGugZ4lFwipwjwWbCepSw%5CjWv31i1Qt%5CWWwtrFzzktj8CdCzniAw%5CgFCElUJnsQygY0MA%3A1515635604215; __utma=94650624.61181594.1515583507.1515630648.1515633862.4; __utmb=94650624.2.10.1515633862' }
    data = {
'params':
'cG5yxYo1s0E9Eqv4QWJLM0fdPiJr0+GfKwqcGPulhOtGJ16gEBopaMhe6XeVNKDigMlpCaV7vrDNQLIOPIaTpAjlcJv +hjdCek6nL0ODfHt9ZEmtkTmU4r/+SA6Vno+o+c4EaPvhghNUXRMdVM/LltKvVanwOSvVhcqUPw9qij1d1akcxweLOWf1hKh2/q/m',
'encSecKey':
'a6c21ac04a44dca0e68174f9dfa85537a2694ecf7b43bdcd46a90836209a3d68008b430b54751bc0f56b12b6da38a265afcef1edbf687d70d1eb853144e920fea28e19a8c6145b7bad33e40d077e8a689b4bf67b367db815278af4ef227b02d85e609007106b7fc4a547bf96a1b90b0eda85bca6cc79ca6fc6559d00060d4184' }
    response = requests.post(url, data=data, headers=headers)
    hotcomments = json.loads(response.text)['hotComments']
    sheet.column_dimensions['F'].width = 256
    for i in range(len(hotcomments)):
          user_name = hotcomments[i]['user']['nickname']
          comment = hotcomments[i]['content']
          like_num = hotcomments[i]['likedCount']
          avatar_url = hotcomments[i]['user']['avatarUrl']
          x = [hot_songs_name, hot_songs_id, user_name, comment, like_num]
          sheet.append(x)
          lst_row = sheet.max_row
          lst_col = sheet.max_column
    
          imgPath = "D:/pachong/img" + str(lst_row) + ".jpg"
          get_avatar(avatar_url + "?param=256y256", imgPath)
          img = Image(imgPath)
          sheet.row_dimensions[lst_row].height = 256
          sheet.add_image(img, "F" + str(lst_row))
          
url = find_cat1_cat2_songlist("华语", "新歌")
hot_songs_name, hot_songs_id = get_all_hotsongs(url)
num = 0
while num < len(hot_songs_name):
    print('正在抓取网易云音乐第%d 首歌曲热评...' % (num + 1))
    get_hotcommnets(hot_songs_name[num], hot_songs_id[num])
    print('第%d 首歌曲热评抓取成功' % (num + 1))
    num += 1
wb.save(filename='Formular1.xlsx')

写回答
好问题 0 提建议
关注问题
分享
邀请回答
编辑收藏删除
收藏举报

19条回答默认最新

关注

码龄粉丝数原力等级 --

被采纳

被点赞

采纳率
yy64ll826 2024-06-04 15:22
关注
【Python】成功解决IndexError: list index out of range
https://zhuanlan.zhihu.com/p/692009787

本回答被题主选为最佳回答 , 对您是否有帮助呢?

解决无用
评论打赏
分享
举报

评论

按下Enter换行，Ctrl+Enter发表内容

查看更多回答(18条)

报告相同问题？

关注问题

【Python编程】常见错误合集与解决方案：典型错误示例及详细解决方法了Python编程中
2025-06-03 21:41

内容概要：本文档《常见错误合集与解决方案.pdf》详细介绍了Python编程中常见的错误及其解决方法。涵盖了多种类型的错误，包括但不限于索引错误（IndexError）、类型错误（TypeError）、属性错误（AttributeError）...
索引错误全解：Python IndexError与KeyError处理
2025-12-08 20:23

二川bro的博客索引错误全解：Python IndexError与KeyError处理
python异常错误怎么看？
2023-04-15 09:38

Pengsen Ma的博客注意这句话 During handling of the above exception, another exception occurred: 它的意思是:在处理上述异常期间，发生了另一个异常：简单理解就是执行try中的代码出现错误，然后执行except 中的代码，在执行...
Python 编程入门与算法进阶三级知识点教案
2024-04-29 21:18

掌握这些基础知识对于学习任何编程语言都至关重要。 - **二进制**：二进制是计算机内部使用的数制，只有0和1两个数字。在Python中，可以通过`bin()`函数将十进制数转换成二进制字符串形式，例如`bin(10)`将返回`'0b...
【Python】解决Python错误报错：IndexError: tuple index out of range
2024-05-30 14:23

I'mAlex的博客解决python报错：IndexError: tuple index out of range
【Python】解决Python报错：IndexError: string index out of range错误
2024-05-30 10:11

I'mAlex的博客解决Python报错：IndexError: string index out of range错误
少儿编程-电子学会Python考级三级知识点汇总
2024-05-31 15:02

### 少儿编程-电子学会Python考级三级知识点汇总 #### 一、编码数制 **1. 编码** - **定义**: 指的是信息从一种形式转换为另一种形式的过程。 - **重要性**: 在计算机科学中极为重要，尤其是在数据传输和存储...
【python】Python报错分析：深入探索`IndexError`及其解决办法
2024-07-12 15:19

景天科技苑的博客 Python报错分析：深入探索`IndexError`及其解决办法
【Python 已解决】列表索引超出范围–Python 中的IndexError: list index out of range 错误
2024-07-17 21:10

二川bro的博客【Python 已解决】列表索引超出范围–Python 中的IndexError: list index out of range 错误
【Python】解决Python报错：IndexError: list index out of range
2024-06-07 13:51

E绵绵的博客通过理解列表的索引机制和确保在安全的范围内访问索引，可以有效预防和解决错误。希望本文提供的策略和实例能帮助你在日常编程中避免此类错误，编写更加健壮的Python代码。
Python 常见的 10 个错误及其解决方法
2024-01-06 20:00

Sitin涛哥的博客更多Python学习内容：ipengtao.com当编写 Python 代码时，难免会遇到各种错误和异常。...在本文中，将深入探讨 Python 中的一些常见错误，包括错误类型、原因和解决方法，以帮助你更好地理解和处理这些问题。
Python中IndexError的索引越界问题：从根源到解决方案
2025-07-01 09:49

喜欢编程就关注我的博客本文系统介绍了Python中IndexError索引越界问题的成因、典型场景及解决方案。文章首先解析了索引越界的本质，列举了循环越界、动态修改列表等常见错误场景。接着提出防御性编程、异常处理、切片操作和迭代器模式四种...
《Python编程基础》20春期末-参考资料.docx
2023-06-13 14:08

《Python编程基础》课程涵盖了Python语言的基础概念与关键特性，是初学者入门的重要参考资料。以下是一些关键知识点的概述： 1. **数字表示法**：Python支持多种数字表示方式，如`0o20`是八进制表示，转换为十进制...
【Python】解决Python报错：IndexError: pop from empty list
2024-05-30 19:15

I'mAlex的博客解决Python报错：IndexError: pop from empty list
17个新手常见Python运行时错误.docx
2022-04-26 11:57

Python 语言是一种易于学习的编程语言，但是新手常常会遇到一些常见的错误。这些错误可能会导致程序崩溃或无法运行。在本文中，我们将总结 17 个新手常见的 Python 运行时错误，帮助您快速避免这些错误，提高编程...
解决Python报错：IndexError: deque index out of range
2024-05-30 19:11

I'mAlex的博客解决Python报错：IndexError: deque index out of range
Python语言基础：异常.pptx
2022-05-05 11:06

异常是编程过程中不可避免的一部分，特别是在Python这种动态类型的高级编程语言中。当程序执行时遇到预期之外的情况，如尝试除以零、访问数组的无效索引、打开不存在的文件等，Python会抛出一个异常。如果不捕获并...
15个常见的Python运行时错误及解决方法！
2025-02-15 17:13

Python_trys的博客本文介绍了15个常见的Python运行时错误，并提供了详细的代码示例和解决方法。理解这些错误及其解决方法将帮助你编写更健壮的Python代码。这个错误是因为尝试对不支持该操作的对象调用方法。这个错误是因为尝试对不...
新手常见Python运行时错误汇总.docx
2024-07-20 21:32

Python 是一种高级编程语言，因其简洁的语法和强大的功能而备受青睐。然而，即便是经验丰富的开发者也难免会在编写过程中遇到各种错误提示。对于初学者来说，理解这些错误信息并解决问题尤为重要。下面将详细介绍...
indexerror_解决IndexError：Python中的列表索引超出范围
2020-09-16 03:09

culing2941的博客索引是项目在数组或列表中的位置，在大多数编程语言中，它从0开始。因此，当我们计算列表中的元素时，我们将从1开始对其进行计数，但是当我们尝试要访问列表的元素，我们将从0开始索引。让我们通过一个示例来理解...
没有解决我的问题, 去提问

问题事件

关注

码龄粉丝数原力等级 --

被采纳

被点赞

采纳率
系统已结题 6月18日
关注

码龄粉丝数原力等级 --

被采纳

被点赞

采纳率
已采纳回答 6月10日
关注

码龄粉丝数原力等级 --

被采纳

被点赞

采纳率
创建了问题 6月3日

Python发生IndexError错误如何解决？

19条回答 默认 最新

问题事件

19条回答默认最新