fintie.stock.gudong 源代码

# -*- coding: utf-8 -*-
# This file is part of fintie.

# Copyright (C) 2018-present qytz <hhhhhf@foxmail.com>
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""提供股东信息查询

信息获取通道包括:

    * 主要股东

      http://xueqiu.com/S/SZ002353/ZYGD

    * 流通股东

      http://xueqiu.com/S/SZ002353/LTGD

    * 限售股东

      http://xueqiu.com/S/SZ002353/XSGDMD

加载已保存的数据::

    import json
    import pandas as pd
    from pathlib import Path

    with Path('xxx.json').open(encoding="utf-8") as f:
        data = json.load(f)

    # 股东户数统计
    df = pd.read_json(Path('xxx.json')
"""
import os
import time
import json
import asyncio
import logging
from pathlib import Path
from datetime import date

import click
import pandas as pd

from .cli import stock_cli_group, MODULE_DATA_DIR
from ..env import _init_in_session
from ..utils import fetch_http_data, add_doc


logger = logging.getLogger(__file__)
__all__ = [
    "async_get_gudong",
    "async_get_gudong_count",
    "get_gudong",
    "get_gudong_count",
]
GUDONG_TYPES = {
    "main": "https://xueqiu.com/stock/f10/shareholder.json",
    "public": "https://xueqiu.com/stock/f10/otsholder.json",
    "limit": "https://xueqiu.com/stock/f10/limskholder.json",
    "count": "https://xueqiu.com/stock/f10/shareholdernum.json",
}


async def _init(session, force=False):
    if force or not _init_in_session.get("xueqiu"):
        _init_in_session["xueqiu"] = True
        await session.get("https://xueqiu.com")
    return True


[文档]async def async_get_gudong_count(session, symbol, data_path=None, return_df=True): """ 从雪球获取股东户数数据 :param session: `aiohttp.ClientSession` 对象,同步接口不需要传 :param symbol: 股票代码 :param data_path: 数据保存路径 :param return_df: 是否返回 `pandas.DataFrame` 对象,False 返回原始数据 :returns: 原始数据或 `pandas.DataFrame` 对象,见 return_df 参数, 失败则返回 `None` """ json_data = await async_get_gudong( session, symbol, gd_type="count", data_path=data_path ) if "list" not in json_data: logger.error("get gudong count failed for %s failed: %s", symbol, json_data) if not return_df: return json_data["list"] return pd.DataFrame(json_data["list"])
[文档]async def async_get_gudong(session, symbol, gd_type, data_path=None): """ 从雪球获取股东数据 :param session: `aiohttp.ClientSession` 对象,同步接口不需要传 :param symbol: 股票代码 :param gd_type: 股东类型 * main 主要股东 * public 流通股东 * limit 限售股东 :param data_path: 数据保存路径 :returns: 原始数据 `dict` 失败则返回 `None` """ assert gd_type in GUDONG_TYPES await _init(session) page_size = 10000 curr_page = 1 params = {"_": 0, "symbol": symbol, "page": curr_page, "size": page_size} logger.info("start download gudong from xueqiu for %s...", symbol) url = GUDONG_TYPES[gd_type] params["_"] = int(time.time() * 1000) date_str = str(date.today()) async with session.get(url, params=params) as resp: if resp.status != 200: logger.warning("get gudong from %s failed: %s", url, resp.status) return None data = await resp.json() if "list" not in data: logger.warn( "no gudong data downloaded for %s from %s: % ", symbol, url, data ) gudong_data = data["list"] if not gudong_data: logger.warn( "no gudong data downloaded for %s from %s, return None", symbol, url ) return None logger.info("download gudong for %s from %s finish", symbol, url) if data_path: data_path = Path(data_path) / MODULE_DATA_DIR / "gudong" os.makedirs(data_path, exist_ok=True) data_fname = "-".join((symbol, gd_type, date_str)) + ".json" data_file = data_path / data_fname with data_file.open("w", encoding="utf-8") as dataf: json.dump(gudong_data, dataf, indent=4, ensure_ascii=False) return gudong_data
[文档]@add_doc(async_get_gudong.__doc__) def get_gudong(*args, **kwargs): ret = fetch_http_data(async_get_gudong, *args, **kwargs) if isinstance(ret, Exception): raise ret return ret
[文档]@add_doc(async_get_gudong_count.__doc__) def get_gudong_count(*args, **kwargs): ret = fetch_http_data(async_get_gudong_count, *args, **kwargs) if isinstance(ret, Exception): raise ret return ret
@click.option("-s", "--symbol", required=True) @click.option( "-t", "--type", "gd_type", help="股东类型", type=click.Choice(GUDONG_TYPES), default="main", show_default=True, ) @click.option( "-f", "--save-path", type=click.Path(exists=False) ) @click.option("-p/-np", "--print/--no-print", "show", default=False) @stock_cli_group.command("gudong") @click.pass_context def gudong_cli(ctx, symbol, gd_type, save_path, show): """从雪球获取股东数据""" if not save_path: save_path = ctx.obj["data_path"] data = get_gudong(symbol, gd_type, save_path) if show: click.echo(data) if __name__ == "__main__": gudong_cli()