Spaces:

gitdeem
/

stock

Running

App Files Files Community

gitdeem committed on Mar 18

Commit

4820aff

verified ·

1 Parent(s): 54e0017

Upload capital_flow_analyzer.py

Browse files

Files changed (1) hide show

capital_flow_analyzer.py +142 -21

capital_flow_analyzer.py CHANGED Viewed

@@ -30,28 +30,149 @@ class CapitalFlowAnalyzer:
                     return cached_data
             # 从akshare获取数据
-            concept_data = ak.stock_fund_flow_concept(symbol=period)
-            # 处理数据
-            result = []
-            for _, row in concept_data.iterrows():
                 try:
-                    # 列名可能有所不同，所以我们使用灵活的方法
-                    item = {
-                        "rank": int(row.get("序号", 0)),
-                        "sector": row.get("行业", ""),
-                        "company_count": int(row.get("公司家数", 0)),
-                        "sector_index": float(row.get("行业指数", 0)),
-                        "change_percent": self._parse_percent(row.get("阶段涨跌幅", "0%")),
-                        "inflow": float(row.get("流入资金", 0)),
-                        "outflow": float(row.get("流出资金", 0)),
-                        "net_flow": float(row.get("净额", 0))
-                    }
-                    result.append(item)
-                except Exception as e:
-                    # self.logger.warning(f"Error processing row in concept fund flow: {str(e)}")
-                    continue
             # 缓存结果
             self.data_cache[cache_key] = (datetime.now(), result)

                     return cached_data
             # 从akshare获取数据
+            try:
+                concept_data = ak.stock_fund_flow_concept(symbol=period)
+                # 记录实际的列名，以便调试
+                self.logger.info(f"Actual columns: {list(concept_data.columns)}")
+                self.logger.info(f"Column count: {len(concept_data.columns)}")
+                # 处理数据
+                result = []
+                for _, row in concept_data.iterrows():
+                    try:
+                        # 使用更灵活的方式获取列数据，适应不同的列名结构
+                        item = {}
+                        # 尝试多种可能的列名
+                        if "序号" in concept_data.columns:
+                            item["rank"] = int(row.get("序号", 0))
+                        elif "排名" in concept_data.columns:
+                            item["rank"] = int(row.get("排名", 0))
+                        else:
+                            item["rank"] = 0
+                        # 行业/概念名称
+                        if "行业" in concept_data.columns:
+                            item["sector"] = row.get("行业", "")
+                        elif "概念名称" in concept_data.columns:
+                            item["sector"] = row.get("概念名称", "")
+                        elif "名称" in concept_data.columns:
+                            item["sector"] = row.get("名称", "")
+                        else:
+                            # 尝试找到包含"名称"的列
+                            name_cols = [col for col in concept_data.columns if "名称" in col or "行业" in col]
+                            if name_cols:
+                                item["sector"] = row.get(name_cols[0], "")
+                            else:
+                                item["sector"] = ""
+                        # 公司家数
+                        if "公司家数" in concept_data.columns:
+                            item["company_count"] = int(row.get("公司家数", 0))
+                        else:
+                            item["company_count"] = 0
+                        # 行业指数
+                        if "行业指数" in concept_data.columns:
+                            item["sector_index"] = float(row.get("行业指数", 0))
+                        elif "概念指数" in concept_data.columns:
+                            item["sector_index"] = float(row.get("概念指数", 0))
+                        else:
+                            item["sector_index"] = 0
+                        # 涨跌幅
+                        if "阶段涨跌幅" in concept_data.columns:
+                            item["change_percent"] = self._parse_percent(row.get("阶段涨跌幅", "0%"))
+                        elif "涨跌幅" in concept_data.columns:
+                            item["change_percent"] = self._parse_percent(row.get("涨跌幅", "0%"))
+                        else:
+                            # 尝试找到包含"涨跌"的列
+                            change_cols = [col for col in concept_data.columns if "涨跌" in col]
+                            if change_cols:
+                                item["change_percent"] = self._parse_percent(row.get(change_cols[0], "0%"))
+                            else:
+                                item["change_percent"] = 0
+                        # 资金流向数据
+                        # 尝试多种可能的列名组合
+                        if "流入资金" in concept_data.columns and "流出资金" in concept_data.columns:
+                            item["inflow"] = float(row.get("流入资金", 0))
+                            item["outflow"] = float(row.get("流出资金", 0))
+                            item["net_flow"] = float(row.get("净额", 0))
+                        elif "主力净流入-净额" in concept_data.columns:
+                            item["inflow"] = 0  # 这种情况下可能没有单独的流入流出数据
+                            item["outflow"] = 0
+                            item["net_flow"] = float(row.get("主力净流入-净额", 0))
+                        else:
+                            # 尝试找到包含特定关键词的列
+                            inflow_cols = [col for col in concept_data.columns if "流入" in col and "净" not in col]
+                            outflow_cols = [col for col in concept_data.columns if "流出" in col and "净" not in col]
+                            net_cols = [col for col in concept_data.columns if "净" in col or "净额" in col]
+                            if inflow_cols:
+                                item["inflow"] = float(row.get(inflow_cols[0], 0))
+                            else:
+                                item["inflow"] = 0
+                            if outflow_cols:
+                                item["outflow"] = float(row.get(outflow_cols[0], 0))
+                            else:
+                                item["outflow"] = 0
+                            if net_cols:
+                                item["net_flow"] = float(row.get(net_cols[0], 0))
+                            else:
+                                # 如果没有净额列，尝试计算
+                                item["net_flow"] = item["inflow"] - item["outflow"]
+                        result.append(item)
+                    except Exception as e:
+                        self.logger.warning(f"Error processing row in concept fund flow: {str(e)}")
+                        continue
+            except ValueError as e:
+                self.logger.error(f"ValueError in stock_fund_flow_concept: {str(e)}")
+                # 如果出现ValueError（可能是列名不匹配），尝试不重命名列直接处理数据
                 try:
+                    concept_data = ak.stock_fund_flow_concept(symbol=period)
+                    self.logger.info(f"Retrying with original columns: {list(concept_data.columns)}")
+                    # 简化处理逻辑，直接使用原始列名
+                    result = []
+                    for _, row in concept_data.iterrows():
+                        try:
+                            item = {}
+                            # 尝试将每一列的数据都添加到结果中
+                            for col in concept_data.columns:
+                                try:
+                                    # 尝试转换为数值类型
+                                    if isinstance(row[col], str) and '%' in row[col]:
+                                        item[col] = self._parse_percent(row[col])
+                                    else:
+                                        try:
+                                            item[col] = float(row[col])
+                                        except (ValueError, TypeError):
+                                            item[col] = row[col]
+                                except Exception:
+                                    item[col] = row[col]
+                            # 添加一些标准化的键，以便与现有代码兼容
+                            if "名称" in item or "概念名称" in item or "行业" in item:
+                                item["sector"] = item.get("名称", item.get("概念名称", item.get("行业", "")))
+                            if "涨跌幅" in item:
+                                item["change_percent"] = item["涨跌幅"]
+                            result.append(item)
+                        except Exception as e:
+                            self.logger.warning(f"Error processing row with original columns: {str(e)}")
+                            continue
+                except Exception as e2:
+                    self.logger.error(f"Failed to process with original columns: {str(e2)}")
+                    # 如果再次失败，返回模拟数据
+                    result = self._generate_mock_concept_fund_flow(period)
             # 缓存结果
             self.data_cache[cache_key] = (datetime.now(), result)