问题

这是您提供的代码的翻译部分：

我一直在尝试为我的项目实现这个功能，但我编写的代码运行一次几乎要花90分钟。我们在OKTA中总共有170个应用程序，活跃用户接近1100人。我在分页和速率限制方面遇到了很多问题，最后写出了一个Python脚本，但它的运行时间太长。如果有人能帮我改进这个脚本，或者建议一种新的实现方法，那将非常有帮助。

import requests
import csv
import os
import time

def get_all_users(domain, okta_api_token):
    """Fetch every user from the Okta Users API, following pagination links.

    Args:
        domain: Okta subdomain; requests go to ``https://{domain}.okta.com``.
        okta_api_token: API token sent in the ``Authorization: SSWS`` header.

    Returns:
        A list holding the JSON items of every page, in the order received.

    Raises:
        requests.HTTPError: On an error status. For HTTP 429 this is raised
            only after several consecutive rate-limited attempts.
        requests.Timeout: If a single request exceeds the timeout.
    """
    headers = {
        'Authorization': f'SSWS {okta_api_token}',
        'Accept': 'application/json',
        'Content-Type': 'application/json'
    }
    url = f'https://{domain}.okta.com/api/v1/users'

    request_timeout = 30        # seconds; without it a stalled socket hangs forever
    max_rate_limit_retries = 5  # consecutive HTTP 429 responses tolerated per page

    all_users = []
    rate_limit_retries = 0
    while url:
        response = requests.get(url, headers=headers, timeout=request_timeout)

        if response.status_code == 429 and rate_limit_retries < max_rate_limit_retries:
            # Rate limited: wait for the window to reset instead of aborting.
            # Okta documents X-Rate-Limit-Reset as a UTC epoch time in seconds.
            rate_limit_retries += 1
            try:
                reset_at = float(response.headers.get('X-Rate-Limit-Reset', ''))
            except ValueError:
                reset_at = 0.0
            # Sleep at least one second to tolerate clock skew or a missing header.
            time.sleep(max(reset_at - time.time(), 1.0))
            continue

        response.raise_for_status()
        rate_limit_retries = 0
        all_users.extend(response.json())

        # requests parses the Link header; no 'next' entry means this was the last page.
        url = response.links.get('next', {}).get('url')

    return all_users

def get_user_apps(domain, okta_api_token, user_id, app_links):
    """Return the labels of one user's app links as a comma-separated string.

    Results are memoised in ``app_links`` so a given user id is requested at
    most once per cache dictionary.

    Args:
        domain: Okta subdomain; requests go to ``https://{domain}.okta.com``.
        okta_api_token: API token sent in the ``Authorization: SSWS`` header.
        user_id: User id inserted into ``/api/v1/users/{user_id}/appLinks``.
        app_links: Dict used as a cache (user id -> joined label string).
            It is updated in place.

    Returns:
        The ``label`` of every returned app link, joined with ``', '``.

    Raises:
        requests.HTTPError: On an error status. For HTTP 429 this is raised
            only after several consecutive rate-limited attempts.
        requests.Timeout: If a single request exceeds the timeout.
        KeyError: If a returned app link has no ``label`` key.
    """
    if user_id in app_links:
        return app_links[user_id]

    headers = {
        'Authorization': f'SSWS {okta_api_token}',
        'Accept': 'application/json',
        'Content-Type': 'application/json'
    }
    url = f'https://{domain}.okta.com/api/v1/users/{user_id}/appLinks'

    request_timeout = 30        # seconds; without it a stalled socket hangs forever
    max_rate_limit_retries = 5  # consecutive HTTP 429 responses tolerated per page

    app_names = []
    rate_limit_retries = 0
    while url:
        response = requests.get(url, headers=headers, timeout=request_timeout)

        if response.status_code == 429 and rate_limit_retries < max_rate_limit_retries:
            # This endpoint is called once per user, so it is the most likely
            # to be throttled. Wait for the window to reset and retry the page.
            # Okta documents X-Rate-Limit-Reset as a UTC epoch time in seconds.
            rate_limit_retries += 1
            try:
                reset_at = float(response.headers.get('X-Rate-Limit-Reset', ''))
            except ValueError:
                reset_at = 0.0
            time.sleep(max(reset_at - time.time(), 1.0))
            continue

        response.raise_for_status()
        rate_limit_retries = 0
        app_names.extend(app['label'] for app in response.json())

        url = response.links.get('next', {}).get('url')

    app_links[user_id] = ', '.join(app_names)
    return app_links[user_id]

def extract_user_data(domain, okta_api_token, users, app_links):
    """Build one flat record per user, including the user's app labels.

    Args:
        domain: Okta subdomain, forwarded to ``get_user_apps``.
        okta_api_token: API token, forwarded to ``get_user_apps``.
        users: Iterable of user dicts; ``id`` and the ``profile`` fields
            ``login``, ``email``, ``firstName`` and ``lastName`` are read,
            each falling back to ``'N/A'`` when absent.
        app_links: Cache dict forwarded to ``get_user_apps``.

    Returns:
        A list of dicts with the keys ``id``, ``username``, ``email``,
        ``full_name`` and ``apps``.
    """
    def build_row(entry):
        # Gather the identity fields first, then look up the app labels.
        uid = entry.get('id', 'N/A')
        login = entry.get('profile', {}).get('login', 'N/A')
        mail = entry.get('profile', {}).get('email', 'N/A')
        given = entry.get('profile', {}).get('firstName', 'N/A')
        family = entry.get('profile', {}).get('lastName', 'N/A')
        display_name = f"{given} {family}"
        linked_apps = get_user_apps(domain, okta_api_token, uid, app_links)
        return {
            'id': uid,
            'username': login,
            'email': mail,
            'full_name': display_name,
            'apps': linked_apps,
        }

    return [build_row(entry) for entry in users]

def extract_app_user_data(domain, okta_api_token, users, app_links=None):
    """Group user logins by the label of each app linked to them.

    Args:
        domain: Okta subdomain, forwarded to ``get_user_apps``.
        okta_api_token: API token, forwarded to ``get_user_apps``.
        users: Iterable of user dicts; ``id`` and ``profile.login`` are read,
            each falling back to ``'N/A'`` when absent.
        app_links: Optional cache dict forwarded to ``get_user_apps``. Pass
            the same dict used for other calls so each user's app links are
            fetched only once; a fresh dict is created when omitted.

    Returns:
        A dict mapping app label to the list of logins that have that app,
        in the order the users were processed.
    """
    if app_links is None:
        app_links = {}

    app_user_data = {}
    for user in users:
        user_id = user.get('id', 'N/A')
        login = user.get('profile', {}).get('login', 'N/A')
        apps = get_user_apps(domain, okta_api_token, user_id, app_links)
        # NOTE: a label that itself contains ', ' is split into pieces here,
        # because get_user_apps returns the labels already joined.
        for app in apps.split(', '):
            if not app:
                # ''.split(', ') is [''], so a user without apps would
                # otherwise be filed under a bogus empty app name.
                continue
            app_user_data.setdefault(app, []).append(login)
    return app_user_data

# Read the domain and okta_api_token from environment variables
domain = os.environ['OKTA_DOMAIN']
okta_api_token = os.environ['OKTA_API_TOKEN']

# Start the timer
start_time = time.time()

# Fetch all users, then fetch each user's app links exactly once.
users = get_all_users(domain, okta_api_token)
app_links = {}
extracted_users = extract_user_data(domain, okta_api_token, users, app_links)

# Derive the app -> logins grouping from the rows already fetched.
# Calling extract_app_user_data() here as well would request every user's
# appLinks a second time, because its cache was not shared with this script.
app_user_data = {}
for row in extracted_users:
    for app in row['apps'].split(', '):
        if app:  # ''.split(', ') is [''] for a user with no apps; skip it
            app_user_data.setdefault(app, []).append(row['username'])

# Save the extracted app/user data to a CSV file
with open('app_user_data.csv', 'w', newline='') as csvfile:
    fieldnames = ['app', 'users']
    writer = csv.DictWriter(csvfile, fieldnames=fieldnames)
    writer.writeheader()

    # 'logins' rather than 'users' so the fetched user list is not rebound.
    for app, logins in app_user_data.items():
        writer.writerow({'app': app, 'users': ', '.join(logins)})

# Save the extracted user data to a CSV file
with open('user_data.csv', 'w', newline='') as csvfile:
    fieldnames = ['id', 'username', 'email', 'full_name', 'apps']
    writer = csv.DictWriter(csvfile, fieldnames=fieldnames)
    writer.writeheader()

    for user in extracted_users:
        writer.writerow(user)

# Calculate and print the execution time
end_time = time.time()
execution_time = end_time - start_time
print(f"执行时间：{execution_time} 秒。")

希望这个翻译有帮助。如果您有其他问题，请随时提出。

英文:

I've been trying to implement this for my project, and the code I've written takes almost 90 minutes to run. We have a total of 170 apps in Okta and close to 1,100 active users. I've had many issues with pagination and rate limiting; I finally came up with a Python script, but it takes forever. If anyone could help me improve my script or suggest a different approach, that would be a great help.

    import requests
import csv
import os
import time
def get_all_users(domain, okta_api_token):
    """Fetch every user from the Okta Users API, following pagination links.

    Args:
        domain: Okta subdomain; requests go to ``https://{domain}.okta.com``.
        okta_api_token: API token sent in the ``Authorization: SSWS`` header.

    Returns:
        A list holding the JSON items of every page, in the order received.

    Raises:
        requests.HTTPError: On an error status. For HTTP 429 this is raised
            only after several consecutive rate-limited attempts.
        requests.Timeout: If a single request exceeds the timeout.
    """
    headers = {
        'Authorization': f'SSWS {okta_api_token}',
        'Accept': 'application/json',
        'Content-Type': 'application/json'
    }
    url = f'https://{domain}.okta.com/api/v1/users'

    request_timeout = 30        # seconds; without it a stalled socket hangs forever
    max_rate_limit_retries = 5  # consecutive HTTP 429 responses tolerated per page

    all_users = []
    rate_limit_retries = 0
    while url:
        response = requests.get(url, headers=headers, timeout=request_timeout)

        if response.status_code == 429 and rate_limit_retries < max_rate_limit_retries:
            # Rate limited: wait for the window to reset instead of aborting.
            # Okta documents X-Rate-Limit-Reset as a UTC epoch time in seconds.
            rate_limit_retries += 1
            try:
                reset_at = float(response.headers.get('X-Rate-Limit-Reset', ''))
            except ValueError:
                reset_at = 0.0
            # Sleep at least one second to tolerate clock skew or a missing header.
            time.sleep(max(reset_at - time.time(), 1.0))
            continue

        response.raise_for_status()
        rate_limit_retries = 0
        all_users.extend(response.json())

        # requests parses the Link header; no 'next' entry means this was the last page.
        url = response.links.get('next', {}).get('url')

    return all_users
def get_user_apps(domain, okta_api_token, user_id, app_links):
    """Return the labels of one user's app links as a comma-separated string.

    Results are memoised in ``app_links`` so a given user id is requested at
    most once per cache dictionary.

    Args:
        domain: Okta subdomain; requests go to ``https://{domain}.okta.com``.
        okta_api_token: API token sent in the ``Authorization: SSWS`` header.
        user_id: User id inserted into ``/api/v1/users/{user_id}/appLinks``.
        app_links: Dict used as a cache (user id -> joined label string).
            It is updated in place.

    Returns:
        The ``label`` of every returned app link, joined with ``', '``.

    Raises:
        requests.HTTPError: On an error status. For HTTP 429 this is raised
            only after several consecutive rate-limited attempts.
        requests.Timeout: If a single request exceeds the timeout.
        KeyError: If a returned app link has no ``label`` key.
    """
    if user_id in app_links:
        return app_links[user_id]

    headers = {
        'Authorization': f'SSWS {okta_api_token}',
        'Accept': 'application/json',
        'Content-Type': 'application/json'
    }
    url = f'https://{domain}.okta.com/api/v1/users/{user_id}/appLinks'

    request_timeout = 30        # seconds; without it a stalled socket hangs forever
    max_rate_limit_retries = 5  # consecutive HTTP 429 responses tolerated per page

    app_names = []
    rate_limit_retries = 0
    while url:
        response = requests.get(url, headers=headers, timeout=request_timeout)

        if response.status_code == 429 and rate_limit_retries < max_rate_limit_retries:
            # This endpoint is called once per user, so it is the most likely
            # to be throttled. Wait for the window to reset and retry the page.
            # Okta documents X-Rate-Limit-Reset as a UTC epoch time in seconds.
            rate_limit_retries += 1
            try:
                reset_at = float(response.headers.get('X-Rate-Limit-Reset', ''))
            except ValueError:
                reset_at = 0.0
            time.sleep(max(reset_at - time.time(), 1.0))
            continue

        response.raise_for_status()
        rate_limit_retries = 0
        app_names.extend(app['label'] for app in response.json())

        url = response.links.get('next', {}).get('url')

    app_links[user_id] = ', '.join(app_names)
    return app_links[user_id]
def extract_user_data(domain, okta_api_token, users, app_links):
    """Build one flat record per user, including the user's app labels.

    Args:
        domain: Okta subdomain, forwarded to ``get_user_apps``.
        okta_api_token: API token, forwarded to ``get_user_apps``.
        users: Iterable of user dicts; ``id`` and the ``profile`` fields
            ``login``, ``email``, ``firstName`` and ``lastName`` are read,
            each falling back to ``'N/A'`` when absent.
        app_links: Cache dict forwarded to ``get_user_apps``.

    Returns:
        A list of dicts with the keys ``id``, ``username``, ``email``,
        ``full_name`` and ``apps``.
    """
    user_data = []
    for user in users:
        # Look the profile up once instead of once per field.
        profile = user.get('profile', {})
        user_id = user.get('id', 'N/A')
        first_name = profile.get('firstName', 'N/A')
        last_name = profile.get('lastName', 'N/A')

        user_data.append({
            'id': user_id,
            'username': profile.get('login', 'N/A'),
            'email': profile.get('email', 'N/A'),
            'full_name': f"{first_name} {last_name}",
            'apps': get_user_apps(domain, okta_api_token, user_id, app_links),
        })
    return user_data
def extract_app_user_data(domain, okta_api_token, users, app_links=None):
    """Group user logins by the label of each app linked to them.

    Args:
        domain: Okta subdomain, forwarded to ``get_user_apps``.
        okta_api_token: API token, forwarded to ``get_user_apps``.
        users: Iterable of user dicts; ``id`` and ``profile.login`` are read,
            each falling back to ``'N/A'`` when absent.
        app_links: Optional cache dict forwarded to ``get_user_apps``. Pass
            the same dict used for other calls so each user's app links are
            fetched only once; a fresh dict is created when omitted.

    Returns:
        A dict mapping app label to the list of logins that have that app,
        in the order the users were processed.
    """
    if app_links is None:
        app_links = {}

    app_user_data = {}
    for user in users:
        user_id = user.get('id', 'N/A')
        login = user.get('profile', {}).get('login', 'N/A')
        apps = get_user_apps(domain, okta_api_token, user_id, app_links)
        # NOTE: a label that itself contains ', ' is split into pieces here,
        # because get_user_apps returns the labels already joined.
        for app in apps.split(', '):
            if not app:
                # ''.split(', ') is [''], so a user without apps would
                # otherwise be filed under a bogus empty app name.
                continue
            app_user_data.setdefault(app, []).append(login)
    return app_user_data
# Read domain and okta_api_token from environment variables
domain = os.environ['OKTA_DOMAIN']
okta_api_token = os.environ['OKTA_API_TOKEN']

# Start the timer
start_time = time.time()

# Fetch all users, then fetch each user's app links exactly once.
users = get_all_users(domain, okta_api_token)
app_links = {}
extracted_users = extract_user_data(domain, okta_api_token, users, app_links)

# Derive the app -> logins grouping from the rows already fetched.
# Calling extract_app_user_data() here as well would request every user's
# appLinks a second time, because its cache was not shared with this script.
app_user_data = {}
for row in extracted_users:
    for app in row['apps'].split(', '):
        if app:  # ''.split(', ') is [''] for a user with no apps; skip it
            app_user_data.setdefault(app, []).append(row['username'])

# Save extracted app user data to a CSV file
with open('app_user_data.csv', 'w', newline='') as csvfile:
    fieldnames = ['app', 'users']
    writer = csv.DictWriter(csvfile, fieldnames=fieldnames)
    writer.writeheader()

    # 'logins' rather than 'users' so the fetched user list is not rebound.
    for app, logins in app_user_data.items():
        writer.writerow({'app': app, 'users': ', '.join(logins)})

# Save extracted user data to a CSV file
with open('user_data.csv', 'w', newline='') as csvfile:
    fieldnames = ['id', 'username', 'email', 'full_name', 'apps']
    writer = csv.DictWriter(csvfile, fieldnames=fieldnames)
    writer.writeheader()

    for user in extracted_users:
        writer.writerow(user)

# Calculate and print the execution time
end_time = time.time()
execution_time = end_time - start_time
print(f"Execution time: {execution_time} seconds.")

答案1

得分: 1

One quick and easy way to make the code faster is to use requests.Session(). A session will keep the connection open, otherwise requests closes it and reopens it every time. It'll make your code shorter and more readable, too. You can set the headers once at the beginning and use the session everywhere.

#!/usr/bin/env python

import requests

# Set these:
url = 'https://COMPANY.okta.com/api/v1/users'
token = '...'

# One shared session carries the auth header on every call made through it,
# which is much faster when making multiple API calls.
session = requests.Session()
session.headers.update({'authorization': f'SSWS {token}'})

def get_objects(url):
    """Yield every object from a paginated list endpoint, page by page.

    Requests are sent through the module-level ``session``. Pagination follows
    the ``next`` relation of each response's ``Link`` header until none remains.

    Args:
        url: URL of the first page.

    Yields:
        Each item of each page's JSON body, in order.

    Raises:
        requests.HTTPError: If any page comes back with an error status.
    """
    while url:
        r = session.get(url)
        # Fail loudly on an error status; otherwise the error payload
        # (presumably a JSON object rather than a list) would be iterated
        # as if it were a page of results.
        r.raise_for_status()
        yield from r.json()
        url = r.links.get('next', {}).get('url')
        
# Stream the users and print each login as it arrives.
for user in get_objects(url):
    login = user['profile']['login']
    print(login)

英文:

#!/usr/bin/env python

import requests

# Set these:
url = 'https://COMPANY.okta.com/api/v1/users'
token = '...'

# If you're making multiple API calls, using a session is much faster.
session = requests.Session()
session.headers['authorization'] = 'SSWS ' + token

def get_objects(url):
    """Yield every object from a paginated list endpoint, page by page.

    Requests are sent through the module-level ``session``. Pagination follows
    the ``next`` relation of each response's ``Link`` header until none remains.

    Args:
        url: URL of the first page.

    Yields:
        Each item of each page's JSON body, in order.

    Raises:
        requests.HTTPError: If any page comes back with an error status.
    """
    while url:
        r = session.get(url)
        # Fail loudly on an error status; otherwise the error payload
        # (presumably a JSON object rather than a list) would be iterated
        # as if it were a page of results.
        r.raise_for_status()
        yield from r.json()
        url = r.links.get('next', {}).get('url')
        
# Stream the users and print each login as it arrives.
for user in get_objects(url):
    print(user['profile']['login'])

通过集体智慧和协作来改善编程学习和解决问题的方式。致力于成为全球开发者共同参与的知识库，让每个人都能够通过互相帮助和分享经验来进步。

列出OKTA中每个应用程序所分配的用户。

问题

答案1

使用Pandas将一个经过筛选的数值分配给一个Python变量。

添加不同的值到使用循环创建的条目。

打印使用Python的信息？

Plotly/Python: 如何填充/扩展月度时间序列以填充X轴？

What's the correct way to type hint an empty list as a literal in python?

如何在Highcharts Gantt中更改本地化的星期名称

如何在同一个流中使用多个过滤器和映射函数？

如何使用Map/Set来将代码优化到O(n)？

.NET MAUI Android在GitHub Actions上构建失败，错误代码为1。

如何在Playwright视觉比较中屏蔽多个定位器？

在C++中，可以使用可变模板参数来检索类型的内部类型。

selenium.common.exceptions.StaleElementReferenceException: Message: stale element reference: stale element not found

Creating and opening a URL to log in to Website via Basic Auth with Robot Framework/Selenium (Python)

AG Grid 在上下文菜单中以大文本形式打开

发表评论